diff --git a/.ipynb_checkpoints/cheese-checkpoint.ipynb b/.ipynb_checkpoints/cheese-checkpoint.ipynb new file mode 100644 index 0000000..88c8de1 --- /dev/null +++ b/.ipynb_checkpoints/cheese-checkpoint.ipynb @@ -0,0 +1,3846 @@ +{ + "cells": [ + { + "cell_type": "markdown", + "id": "5f7c9658-c285-4854-96c0-e899fc55421b", + "metadata": {}, + "source": [ + "# DM project: cheese" + ] + }, + { + "cell_type": "code", + "execution_count": 43, + "id": "7f4f2b89-8257-468c-9f5e-a77e11b8b8ff", + "metadata": {}, + "outputs": [], + "source": [ + "import pandas as pd\n", + "from mlxtend.preprocessing import TransactionEncoder\n", + "from mlxtend.frequent_patterns import apriori\n", + "from geopy.geocoders import Nominatim\n", + "import matplotlib.pyplot as plt\n", + "import time\n", + "import tqdm.notebook as tqdm\n", + "import random\n" + ] + }, + { + "cell_type": "code", + "execution_count": 44, + "id": "1a0afba8-692b-4377-a2ce-5114983e3bbb", + "metadata": {}, + "outputs": [ + { + "data": { + "text/html": [ + "
\n", + " | cheese | \n", + "url | \n", + "milk | \n", + "country | \n", + "region | \n", + "family | \n", + "type | \n", + "fat_content | \n", + "calcium_content | \n", + "texture | \n", + "rind | \n", + "color | \n", + "flavor | \n", + "aroma | \n", + "vegetarian | \n", + "vegan | \n", + "synonyms | \n", + "alt_spellings | \n", + "producers | \n", + "
---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
0 | \n", + "Aarewasser | \n", + "https://www.cheese.com/aarewasser/ | \n", + "cow | \n", + "Switzerland | \n", + "NaN | \n", + "NaN | \n", + "semi-soft | \n", + "NaN | \n", + "NaN | \n", + "buttery | \n", + "washed | \n", + "yellow | \n", + "sweet | \n", + "buttery | \n", + "False | \n", + "False | \n", + "NaN | \n", + "NaN | \n", + "Jumi | \n", + "
1 | \n", + "Abbaye de Belloc | \n", + "https://www.cheese.com/abbaye-de-belloc/ | \n", + "sheep | \n", + "France | \n", + "Pays Basque | \n", + "NaN | \n", + "semi-hard, artisan | \n", + "NaN | \n", + "NaN | \n", + "creamy, dense, firm | \n", + "natural | \n", + "yellow | \n", + "burnt caramel | \n", + "lanoline | \n", + "True | \n", + "False | \n", + "Abbaye Notre-Dame de Belloc | \n", + "NaN | \n", + "NaN | \n", + "
2 | \n", + "Abbaye de Belval | \n", + "https://www.cheese.com/abbaye-de-belval/ | \n", + "cow | \n", + "France | \n", + "NaN | \n", + "NaN | \n", + "semi-hard | \n", + "40-46% | \n", + "NaN | \n", + "elastic | \n", + "washed | \n", + "ivory | \n", + "NaN | \n", + "aromatic | \n", + "False | \n", + "False | \n", + "NaN | \n", + "NaN | \n", + "NaN | \n", + "
3 | \n", + "Abbaye de Citeaux | \n", + "https://www.cheese.com/abbaye-de-citeaux/ | \n", + "cow | \n", + "France | \n", + "Burgundy | \n", + "NaN | \n", + "semi-soft, artisan, brined | \n", + "NaN | \n", + "NaN | \n", + "creamy, dense, smooth | \n", + "washed | \n", + "white | \n", + "acidic, milky, smooth | \n", + "barnyardy, earthy | \n", + "False | \n", + "False | \n", + "NaN | \n", + "NaN | \n", + "NaN | \n", + "
4 | \n", + "Abbaye de Tamié | \n", + "https://www.cheese.com/tamie/ | \n", + "cow | \n", + "France | \n", + "Savoie | \n", + "NaN | \n", + "soft, artisan | \n", + "NaN | \n", + "NaN | \n", + "creamy, open, smooth | \n", + "washed | \n", + "white | \n", + "fruity, nutty | \n", + "perfumed, pungent | \n", + "False | \n", + "False | \n", + "NaN | \n", + "Tamié, Trappiste de Tamie, Abbey of Tamie | \n", + "NaN | \n", + "
... | \n", + "... | \n", + "... | \n", + "... | \n", + "... | \n", + "... | \n", + "... | \n", + "... | \n", + "... | \n", + "... | \n", + "... | \n", + "... | \n", + "... | \n", + "... | \n", + "... | \n", + "... | \n", + "... | \n", + "... | \n", + "... | \n", + "... | \n", + "
1182 | \n", + "Sveciaost | \n", + "https://www.cheese.com/sveciaost/ | \n", + "cow | \n", + "Sweden | \n", + "Low-laying regions | \n", + "NaN | \n", + "semi-hard, brined | \n", + "45% | \n", + "NaN | \n", + "creamy, supple | \n", + "rindless | \n", + "pale yellow | \n", + "acidic | \n", + "NaN | \n", + "False | \n", + "False | \n", + "NaN | \n", + "NaN | \n", + "NaN | \n", + "
1183 | \n", + "Swag | \n", + "https://www.cheese.com/swag/ | \n", + "goat | \n", + "Australia | \n", + "South Australia | \n", + "NaN | \n", + "fresh firm, artisan | \n", + "NaN | \n", + "NaN | \n", + "creamy, crumbly | \n", + "ash coated | \n", + "white | \n", + "acidic, creamy | \n", + "fresh | \n", + "True | \n", + "False | \n", + "NaN | \n", + "NaN | \n", + "Woodside Cheese Wrights | \n", + "
1184 | \n", + "Swaledale | \n", + "https://www.cheese.com/swaledale/ | \n", + "sheep | \n", + "England | \n", + "Swaledale, North Yorkshire | \n", + "NaN | \n", + "hard | \n", + "NaN | \n", + "NaN | \n", + "semi firm | \n", + "NaN | \n", + "yellow | \n", + "smooth, sweet | \n", + "floral | \n", + "True | \n", + "False | \n", + "Swaledale Sheep Cheese | \n", + "NaN | \n", + "NaN | \n", + "
1185 | \n", + "Sweet Style Swiss | \n", + "https://www.cheese.com/sweet-style-swiss/ | \n", + "NaN | \n", + "Switzerland | \n", + "NaN | \n", + "NaN | \n", + "semi-hard, artisan | \n", + "NaN | \n", + "NaN | \n", + "firm, supple | \n", + "waxed | \n", + "NaN | \n", + "nutty | \n", + "nutty, sweet | \n", + "False | \n", + "False | \n", + "NaN | \n", + "NaN | \n", + "NaN | \n", + "
1186 | \n", + "Swiss cheese | \n", + "https://www.cheese.com/swiss/ | \n", + "cow | \n", + "United States | \n", + "NaN | \n", + "Swiss Cheese | \n", + "hard, artisan, processed | \n", + "7.8 g/100g | \n", + "NaN | \n", + "firm | \n", + "rindless | \n", + "pale yellow | \n", + "nutty, sweet | \n", + "NaN | \n", + "True | \n", + "False | \n", + "American Swiss Cheese | \n", + "NaN | \n", + "Various | \n", + "
1187 rows × 19 columns
\n", + "\n", + " | cheese | \n", + "url | \n", + "milk | \n", + "country | \n", + "region | \n", + "family | \n", + "type | \n", + "fat_content | \n", + "calcium_content | \n", + "texture | \n", + "rind | \n", + "color | \n", + "flavor | \n", + "aroma | \n", + "vegetarian | \n", + "vegan | \n", + "synonyms | \n", + "alt_spellings | \n", + "producers | \n", + "
---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
10 | \n", + "Acapella | \n", + "https://www.cheese.com/acapella/ | \n", + "goat | \n", + "United States | \n", + "California | \n", + "NaN | \n", + "soft, soft-ripened | \n", + "NaN | \n", + "NaN | \n", + "NaN | \n", + "NaN | \n", + "NaN | \n", + "buttery | \n", + "fresh, herbal | \n", + "False | \n", + "False | \n", + "NaN | \n", + "NaN | \n", + "NaN | \n", + "
13 | \n", + "Acorn | \n", + "https://www.cheese.com/acorn/ | \n", + "sheep | \n", + "United Kingdom | \n", + "Bethania | \n", + "NaN | \n", + "hard, artisan | \n", + "52% | \n", + "NaN | \n", + "crumbly, firm | \n", + "NaN | \n", + "NaN | \n", + "burnt caramel, citrusy, herbaceous | \n", + "fruity | \n", + "True | \n", + "False | \n", + "NaN | \n", + "NaN | \n", + "NaN | \n", + "
19 | \n", + "Afuega'l Pitu | \n", + "https://www.cheese.com/afuegal-pitu/ | \n", + "cow | \n", + "Spain | \n", + "Asturias | \n", + "NaN | \n", + "soft, artisan | \n", + "NaN | \n", + "NaN | \n", + "smooth | \n", + "cloth wrapped | \n", + "NaN | \n", + "spicy, strong | \n", + "NaN | \n", + "False | \n", + "False | \n", + "NaN | \n", + "NaN | \n", + "NaN | \n", + "
48 | \n", + "Alpe di Frabosa | \n", + "https://www.cheese.com/alpe-di-frabosa/ | \n", + "cow | \n", + "Italy | \n", + "NaN | \n", + "NaN | \n", + "semi-soft | \n", + "NaN | \n", + "NaN | \n", + "NaN | \n", + "NaN | \n", + "NaN | \n", + "bitter | \n", + "milky, mushroom | \n", + "False | \n", + "False | \n", + "NaN | \n", + "NaN | \n", + "NaN | \n", + "
50 | \n", + "Alpicrème | \n", + "https://www.cheese.com/alpicreme/ | \n", + "goat | \n", + "France | \n", + "NaN | \n", + "NaN | \n", + "soft | \n", + "NaN | \n", + "NaN | \n", + "NaN | \n", + "NaN | \n", + "NaN | \n", + "NaN | \n", + "NaN | \n", + "False | \n", + "False | \n", + "NaN | \n", + "NaN | \n", + "NaN | \n", + "
... | \n", + "... | \n", + "... | \n", + "... | \n", + "... | \n", + "... | \n", + "... | \n", + "... | \n", + "... | \n", + "... | \n", + "... | \n", + "... | \n", + "... | \n", + "... | \n", + "... | \n", + "... | \n", + "... | \n", + "... | \n", + "... | \n", + "... | \n", + "
1172 | \n", + "Strathdon Blue | \n", + "https://www.cheese.com/strathdon-blue/ | \n", + "cow | \n", + "Scotland | \n", + "Tain | \n", + "Blue | \n", + "semi-soft | \n", + "NaN | \n", + "NaN | \n", + "creamy | \n", + "NaN | \n", + "NaN | \n", + "creamy, spicy | \n", + "aromatic, rich | \n", + "True | \n", + "False | \n", + "NaN | \n", + "NaN | \n", + "Highland Fine Cheeses Limited | \n", + "
1175 | \n", + "String Cheese | \n", + "https://www.cheese.com/string/ | \n", + "NaN | \n", + "NaN | \n", + "NaN | \n", + "NaN | \n", + "semi-hard | \n", + "NaN | \n", + "NaN | \n", + "chewy, firm, stringy | \n", + "NaN | \n", + "NaN | \n", + "NaN | \n", + "NaN | \n", + "NaN | \n", + "NaN | \n", + "NaN | \n", + "NaN | \n", + "NaN | \n", + "
1177 | \n", + "Sulguni | \n", + "https://www.cheese.com/sulguni/ | \n", + "buffalo, cow | \n", + "Georgia | \n", + "Svaneti, Samegrelo | \n", + "NaN | \n", + "semi-firm | \n", + "NaN | \n", + "NaN | \n", + "dense, elastic | \n", + "NaN | \n", + "NaN | \n", + "salty, smokey , sour | \n", + "NaN | \n", + "NaN | \n", + "NaN | \n", + "Georgian Pickle Cheese | \n", + "Megruli Sulguni, Shebolili Megruli Sulguni | \n", + "NaN | \n", + "
1181 | \n", + "Sussex Slipcote | \n", + "https://www.cheese.com/sussex-slipcote/ | \n", + "sheep | \n", + "England | \n", + "NaN | \n", + "NaN | \n", + "soft | \n", + "NaN | \n", + "NaN | \n", + "NaN | \n", + "NaN | \n", + "NaN | \n", + "sharp | \n", + "NaN | \n", + "True | \n", + "False | \n", + "NaN | \n", + "NaN | \n", + "High Weald Dairy | \n", + "
1185 | \n", + "Sweet Style Swiss | \n", + "https://www.cheese.com/sweet-style-swiss/ | \n", + "NaN | \n", + "Switzerland | \n", + "NaN | \n", + "NaN | \n", + "semi-hard, artisan | \n", + "NaN | \n", + "NaN | \n", + "firm, supple | \n", + "waxed | \n", + "NaN | \n", + "nutty | \n", + "nutty, sweet | \n", + "False | \n", + "False | \n", + "NaN | \n", + "NaN | \n", + "NaN | \n", + "
142 rows × 19 columns
\n", + "\n", + " | cheese | \n", + "milk | \n", + "country | \n", + "region | \n", + "family | \n", + "type | \n", + "texture | \n", + "rind | \n", + "color | \n", + "flavor | \n", + "aroma | \n", + "vegetarian | \n", + "vegan | \n", + "
---|---|---|---|---|---|---|---|---|---|---|---|---|---|
0 | \n", + "Aarewasser | \n", + "cow | \n", + "Switzerland | \n", + "NaN | \n", + "NaN | \n", + "semi-soft | \n", + "buttery | \n", + "washed | \n", + "yellow | \n", + "sweet | \n", + "buttery | \n", + "False | \n", + "False | \n", + "
1 | \n", + "Abbaye de Belloc | \n", + "sheep | \n", + "France | \n", + "Pays Basque | \n", + "NaN | \n", + "semi-hard, artisan | \n", + "creamy, dense, firm | \n", + "natural | \n", + "yellow | \n", + "burnt caramel | \n", + "lanoline | \n", + "True | \n", + "False | \n", + "
2 | \n", + "Abbaye de Belval | \n", + "cow | \n", + "France | \n", + "NaN | \n", + "NaN | \n", + "semi-hard | \n", + "elastic | \n", + "washed | \n", + "ivory | \n", + "NaN | \n", + "aromatic | \n", + "False | \n", + "False | \n", + "
3 | \n", + "Abbaye de Citeaux | \n", + "cow | \n", + "France | \n", + "Burgundy | \n", + "NaN | \n", + "semi-soft, artisan, brined | \n", + "creamy, dense, smooth | \n", + "washed | \n", + "white | \n", + "acidic, milky, smooth | \n", + "barnyardy, earthy | \n", + "False | \n", + "False | \n", + "
4 | \n", + "Abbaye de Tamié | \n", + "cow | \n", + "France | \n", + "Savoie | \n", + "NaN | \n", + "soft, artisan | \n", + "creamy, open, smooth | \n", + "washed | \n", + "white | \n", + "fruity, nutty | \n", + "perfumed, pungent | \n", + "False | \n", + "False | \n", + "
... | \n", + "... | \n", + "... | \n", + "... | \n", + "... | \n", + "... | \n", + "... | \n", + "... | \n", + "... | \n", + "... | \n", + "... | \n", + "... | \n", + "... | \n", + "... | \n", + "
1182 | \n", + "Sveciaost | \n", + "cow | \n", + "Sweden | \n", + "Low-laying regions | \n", + "NaN | \n", + "semi-hard, brined | \n", + "creamy, supple | \n", + "rindless | \n", + "pale yellow | \n", + "acidic | \n", + "NaN | \n", + "False | \n", + "False | \n", + "
1183 | \n", + "Swag | \n", + "goat | \n", + "Australia | \n", + "South Australia | \n", + "NaN | \n", + "fresh firm, artisan | \n", + "creamy, crumbly | \n", + "ash coated | \n", + "white | \n", + "acidic, creamy | \n", + "fresh | \n", + "True | \n", + "False | \n", + "
1184 | \n", + "Swaledale | \n", + "sheep | \n", + "England | \n", + "Swaledale, North Yorkshire | \n", + "NaN | \n", + "hard | \n", + "semi firm | \n", + "NaN | \n", + "yellow | \n", + "smooth, sweet | \n", + "floral | \n", + "True | \n", + "False | \n", + "
1185 | \n", + "Sweet Style Swiss | \n", + "NaN | \n", + "Switzerland | \n", + "NaN | \n", + "NaN | \n", + "semi-hard, artisan | \n", + "firm, supple | \n", + "waxed | \n", + "NaN | \n", + "nutty | \n", + "nutty, sweet | \n", + "False | \n", + "False | \n", + "
1186 | \n", + "Swiss cheese | \n", + "cow | \n", + "United States | \n", + "NaN | \n", + "Swiss Cheese | \n", + "hard, artisan, processed | \n", + "firm | \n", + "rindless | \n", + "pale yellow | \n", + "nutty, sweet | \n", + "NaN | \n", + "True | \n", + "False | \n", + "
1187 rows × 13 columns
\n", + "\n", + " | cheese | \n", + "milk | \n", + "country | \n", + "region | \n", + "family | \n", + "type | \n", + "texture | \n", + "rind | \n", + "color | \n", + "flavor | \n", + "aroma | \n", + "vegetarian | \n", + "vegan | \n", + "
---|---|---|---|---|---|---|---|---|---|---|---|---|---|
12 | \n", + "Ackawi | \n", + "cow, goat, sheep | \n", + "Cyprus, Egypt, Israel, Jordan, Lebanon, Middle... | \n", + "+ | \n", + "Feta | \n", + "soft, brined | \n", + "elastic, smooth, springy | \n", + "natural | \n", + "white | \n", + "mild, milky, salty | \n", + "mild, milky | \n", + "False | \n", + "False | \n", + "
116 | \n", + "Baladi | \n", + "cow, goat, sheep | \n", + "Lebanon, Middle East | \n", + "\n", + " | NaN | \n", + "fresh soft, artisan | \n", + "creamy, dense, smooth | \n", + "rindless | \n", + "white | \n", + "buttery, mild, salty, sweet | \n", + "fresh | \n", + "False | \n", + "False | \n", + "
160 | \n", + "Beemster 2% Milk | \n", + "cow | \n", + "Canada, Denmark, France, Germany, Netherlands,... | \n", + "\n", + " | NaN | \n", + "semi-soft | \n", + "smooth | \n", + "NaN | \n", + "NaN | \n", + "nutty | \n", + "aromatic, floral, fruity | \n", + "False | \n", + "False | \n", + "
212 | \n", + "Blissful Blocks | \n", + "NaN | \n", + "Canada, United States | \n", + "\n", + " | Cheddar | \n", + "hard | \n", + "creamy, crumbly | \n", + "plastic | \n", + "yellow | \n", + "creamy, savory, sharp, spicy | \n", + "NaN | \n", + "True | \n", + "False | \n", + "
213 | \n", + "Blissful Toppings | \n", + "NaN | \n", + "Canada, United States | \n", + "\n", + " | Parmesan | \n", + "soft | \n", + "crumbly | \n", + "artificial | \n", + "yellow | \n", + "savory, sharp | \n", + "NaN | \n", + "True | \n", + "False | \n", + "
243 | \n", + "Bootlegger | \n", + "cow, sheep | \n", + "Canada, Italy | \n", + "Lombardy | \n", + "NaN | \n", + "hard, artisan | \n", + "crumbly, firm | \n", + "natural | \n", + "pale yellow | \n", + "fruity, full-flavored, strong | \n", + "floral | \n", + "NaN | \n", + "NaN | \n", + "
262 | \n", + "Brebis d'Azure | \n", + "sheep | \n", + "Canada, Italy | \n", + "Lombardy | \n", + "Blue | \n", + "semi-hard, artisan, blue-veined | \n", + "soft | \n", + "natural | \n", + "pale yellow | \n", + "sharp | \n", + "aromatic | \n", + "NaN | \n", + "NaN | \n", + "
297 | \n", + "Brunost | \n", + "cow, goat | \n", + "Denmark, Finland, Germany, Iceland, Norway, Sw... | \n", + "\n", + " | NaN | \n", + "semi-soft, whey | \n", + "dense | \n", + "natural | \n", + "brown | \n", + "caramel, sweet | \n", + "NaN | \n", + "NaN | \n", + "NaN | \n", + "
300 | \n", + "Bryndza | \n", + "sheep | \n", + "Hungary, Poland, Slovakia | \n", + "\n", + " | NaN | \n", + "soft, artisan | \n", + "spreadable | \n", + "rindless | \n", + "white | \n", + "mild, salty | \n", + "NaN | \n", + "NaN | \n", + "NaN | \n", + "
311 | \n", + "Burrata | \n", + "water buffalo | \n", + "Italy, United States | \n", + "Apulia | \n", + "Mozzarella | \n", + "fresh soft, artisan | \n", + "creamy, stringy | \n", + "leaf wrapped | \n", + "white | \n", + "buttery, milky | \n", + "fresh, milky | \n", + "False | \n", + "False | \n", + "
316 | \n", + "Butterkase | \n", + "cow | \n", + "Austria, Germany | \n", + "\n", + " | NaN | \n", + "semi-soft | \n", + "creamy, smooth, spreadable | \n", + "natural | \n", + "pale yellow | \n", + "buttery, mild | \n", + "NaN | \n", + "False | \n", + "False | \n", + "
367 | \n", + "Cap Cressy | \n", + "goat | \n", + "Canada, Italy | \n", + "Lombardy | \n", + "NaN | \n", + "semi-hard, artisan, smear-ripened | \n", + "compact, dense | \n", + "washed | \n", + "pale yellow | \n", + "mellow, savory, sweet | \n", + "lactic | \n", + "NaN | \n", + "NaN | \n", + "
375 | \n", + "Capri Blu | \n", + "goat | \n", + "Canada, Italy | \n", + "Lombardy | \n", + "Blue | \n", + "soft, blue-veined | \n", + "creamy, soft | \n", + "natural | \n", + "pale yellow | \n", + "creamy, subtle, sweet | \n", + "goaty | \n", + "NaN | \n", + "NaN | \n", + "
377 | \n", + "Caprice | \n", + "goat | \n", + "Canada, Italy | \n", + "Lombardy | \n", + "NaN | \n", + "soft | \n", + "creamy, smooth | \n", + "natural | \n", + "white | \n", + "subtle | \n", + "goaty | \n", + "NaN | \n", + "NaN | \n", + "
407 | \n", + "Casu marzu | \n", + "sheep | \n", + "France, Italy | \n", + "Sardinia (Italy), Southern Corsica (France) | \n", + "NaN | \n", + "soft, soft-ripened | \n", + "soft-ripened | \n", + "natural | \n", + "NaN | \n", + "NaN | \n", + "NaN | \n", + "NaN | \n", + "NaN | \n", + "
437 | \n", + "Cheese Curds | \n", + "NaN | \n", + "Canada, India, United States | \n", + "\n", + " | Cheddar | \n", + "fresh firm | \n", + "firm, springy | \n", + "natural | \n", + "white | \n", + "mild, milky | \n", + "fresh | \n", + "NaN | \n", + "NaN | \n", + "
445 | \n", + "Chhurpi | \n", + "cow, yak | \n", + "China, Nepal, Tibet | \n", + "\n", + " | Cottage | \n", + "soft, hard, artisan | \n", + "dense | \n", + "natural | \n", + "pale yellow | \n", + "tangy | \n", + "NaN | \n", + "NaN | \n", + "NaN | \n", + "
455 | \n", + "Chura Kampo | \n", + "yak | \n", + "China, Tibet | \n", + "Tibet | \n", + "NaN | \n", + "hard, artisan | \n", + "dense, dry, firm | \n", + "natural | \n", + "NaN | \n", + "NaN | \n", + "aromatic | \n", + "NaN | \n", + "NaN | \n", + "
508 | \n", + "Cottage Cheese | \n", + "cow | \n", + "United Kingdom, United States | \n", + "\n", + " | Cottage | \n", + "soft, artisan, processed | \n", + "creamy, crumbly | \n", + "rindless | \n", + "white | \n", + "sweet | \n", + "NaN | \n", + "True | \n", + "False | \n", + "
512 | \n", + "Counting Sheep…and Goats... | \n", + "cow, goat, sheep | \n", + "Canada, Italy | \n", + "Lombardy | \n", + "NaN | \n", + "soft, soft-ripened | \n", + "creamy, soft | \n", + "NaN | \n", + "white | \n", + "creamy, subtle, sweet | \n", + "nutty | \n", + "NaN | \n", + "NaN | \n", + "
524 | \n", + "Cream Cheesy Bliss | \n", + "NaN | \n", + "Canada, United States | \n", + "\n", + " | NaN | \n", + "soft | \n", + "creamy, spreadable | \n", + "artificial | \n", + "white | \n", + "creamy, garlicky, herbaceous, sweet | \n", + "rich | \n", + "True | \n", + "False | \n", + "
537 | \n", + "Cressy Blu | \n", + "cow | \n", + "Canada, Italy | \n", + "Lombardy | \n", + "Blue | \n", + "semi-hard, blue-veined | \n", + "creamy, crumbly, firm | \n", + "natural | \n", + "pale yellow | \n", + "creamy, savory, sweet | \n", + "NaN | \n", + "NaN | \n", + "NaN | \n", + "
569 | \n", + "La Couronne - Fort Aged Comté | \n", + "cow | \n", + "France, Switzerland | \n", + "Franche Comté | \n", + "NaN | \n", + "semi-hard | \n", + "dense | \n", + "NaN | \n", + "pale yellow | \n", + "caramel, nutty, sweet | \n", + "rich | \n", + "NaN | \n", + "NaN | \n", + "
601 | \n", + "Lamb Chopper | \n", + "sheep | \n", + "Netherlands, United States | \n", + "California | \n", + "Gouda | \n", + "hard | \n", + "dense, firm, smooth | \n", + "waxed | \n", + "ivory | \n", + "buttery, caramel, creamy, nutty, sweet | \n", + "mild, sweet | \n", + "True | \n", + "False | \n", + "
621 | \n", + "Le Conquerant Demi Pont L'eveque | \n", + "cow | \n", + "Australia, France | \n", + "\n", + " | NaN | \n", + "soft, artisan | \n", + "chalky, creamy, soft | \n", + "washed | \n", + "NaN | \n", + "creamy, mild | \n", + "pungent | \n", + "NaN | \n", + "NaN | \n", + "
646 | \n", + "Limburger | \n", + "cow | \n", + "Belgium, Germany, Netherlands | \n", + "Duchy of Limburg | \n", + "NaN | \n", + "semi-soft, smear-ripened | \n", + "crumbly, firm, smooth | \n", + "washed | \n", + "straw | \n", + "grassy, mild, mushroomy | \n", + "stinky | \n", + "False | \n", + "False | \n", + "
675 | \n", + "Lunetta | \n", + "cow | \n", + "Canada, Italy | \n", + "Lombardy | \n", + "NaN | \n", + "fresh soft, artisan | \n", + "creamy | \n", + "natural | \n", + "white | \n", + "creamy, salty | \n", + "aromatic, fresh | \n", + "NaN | \n", + "NaN | \n", + "
701 | \n", + "Mamirolle | \n", + "cow | \n", + "Canada, France | \n", + "Plessisville, Quebec | \n", + "NaN | \n", + "semi-soft, artisan | \n", + "chewy, supple | \n", + "washed | \n", + "ivory | \n", + "buttery, fruity, salty, sweet | \n", + "earthy, pungent | \n", + "False | \n", + "False | \n", + "
776 | \n", + "Monastery Cheeses | \n", + "cow | \n", + "Belgium, Canada, France, Switzerland, United S... | \n", + "\n", + " | NaN | \n", + "soft, semi-soft, brined | \n", + "chalky, creamy, firm, grainy | \n", + "washed | \n", + "golden yellow | \n", + "mild, pungent | \n", + "pungent, strong | \n", + "False | \n", + "False | \n", + "
789 | \n", + "Monterey Jack | \n", + "cow | \n", + "Mexico, United States | \n", + "Monterey, California | \n", + "Monterey Jack | \n", + "semi-hard | \n", + "compact, creamy, firm, open, supple | \n", + "NaN | \n", + "pale yellow | \n", + "buttery, mild | \n", + "aromatic | \n", + "NaN | \n", + "NaN | \n", + "
852 | \n", + "Paneer | \n", + "cow, water buffalo | \n", + "Bangladesh, India | \n", + "\n", + " | Cottage | \n", + "fresh firm | \n", + "crumbly, firm | \n", + "rindless | \n", + "white | \n", + "milky | \n", + "fresh, milky | \n", + "True | \n", + "False | \n", + "
975 | \n", + "President Fat Free Feta | \n", + "cow | \n", + "France, United States | \n", + "New York | \n", + "Feta | \n", + "firm, artisan, brined | \n", + "crumbly | \n", + "natural | \n", + "white | \n", + "herbaceous, salty, tangy | \n", + "fresh | \n", + "NaN | \n", + "NaN | \n", + "
1001 | \n", + "Purple's a Must | \n", + "cow, goat | \n", + "Canada, Italy | \n", + "Lombardy | \n", + "Blue | \n", + "semi-hard, artisan, blue-veined | \n", + "creamy, crumbly | \n", + "mold ripened | \n", + "pale yellow | \n", + "full-flavored, strong | \n", + "rich | \n", + "NaN | \n", + "NaN | \n", + "
1082 | \n", + "Shanklish | \n", + "cow, sheep | \n", + "Egypt, Lebanon, Syria | \n", + "\n", + " | Feta | \n", + "fresh firm, hard, artisan | \n", + "creamy, crumbly, firm | \n", + "mold ripened | \n", + "white | \n", + "sharp, spicy, strong | \n", + "pungent, strong | \n", + "False | \n", + "False | \n", + "
1099 | \n", + "Shredded Bliss | \n", + "NaN | \n", + "Canada, United States | \n", + "\n", + " | Mozzarella | \n", + "semi-soft | \n", + "elastic, smooth, springy, stringy | \n", + "plastic | \n", + "pale yellow | \n", + "mild, milky | \n", + "fresh, mild | \n", + "True | \n", + "False | \n", + "
1106 | \n", + "Sirene | \n", + "cow, goat, sheep | \n", + "Albania, Bulgaria, Croatia, Greece, Israel, Ma... | \n", + "Trakia | \n", + "Feta | \n", + "fresh soft, brined | \n", + "crumbly, grainy, smooth | \n", + "natural | \n", + "white | \n", + "lemony, salty, sharp, tangy | \n", + "strong | \n", + "False | \n", + "False | \n", + "
1108 | \n", + "Slices Of Bliss | \n", + "NaN | \n", + "Canada, United States | \n", + "\n", + " | Cheddar | \n", + "soft | \n", + "creamy | \n", + "plastic | \n", + "yellow | \n", + "creamy, savory, sharp, spicy | \n", + "NaN | \n", + "True | \n", + "False | \n", + "
1123 | \n", + "Sosha | \n", + "goat, yak | \n", + "China, Nepal, Tibet | \n", + "Tibet | \n", + "NaN | \n", + "soft, artisan | \n", + "creamy | \n", + "natural | \n", + "white | \n", + "pungent, strong | \n", + "pungent, strong | \n", + "NaN | \n", + "NaN | \n", + "
1173 | \n", + "Strawberry Moon | \n", + "cow | \n", + "Canada, Italy | \n", + "Lombardy | \n", + "NaN | \n", + "semi-hard, artisan, smear-ripened | \n", + "compact, creamy, dense | \n", + "washed | \n", + "straw | \n", + "subtle, sweet | \n", + "strong | \n", + "NaN | \n", + "NaN | \n", + "
\n", + " | cheese | \n", + "milk | \n", + "country | \n", + "region | \n", + "family | \n", + "type | \n", + "texture | \n", + "rind | \n", + "color | \n", + "flavor | \n", + "aroma | \n", + "vegetarian | \n", + "vegan | \n", + "location | \n", + "
---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
0 | \n", + "Aarewasser | \n", + "cow | \n", + "Switzerland | \n", + "\n", + " | NaN | \n", + "semi-soft | \n", + "buttery | \n", + "washed | \n", + "yellow | \n", + "sweet | \n", + "buttery | \n", + "False | \n", + "False | \n", + ", Switzerland | \n", + "
1 | \n", + "Abbaye de Belloc | \n", + "sheep | \n", + "France | \n", + "Pays Basque | \n", + "NaN | \n", + "semi-hard, artisan | \n", + "creamy, dense, firm | \n", + "natural | \n", + "yellow | \n", + "burnt caramel | \n", + "lanoline | \n", + "True | \n", + "False | \n", + "Pays Basque, France | \n", + "
2 | \n", + "Abbaye de Belval | \n", + "cow | \n", + "France | \n", + "\n", + " | NaN | \n", + "semi-hard | \n", + "elastic | \n", + "washed | \n", + "ivory | \n", + "NaN | \n", + "aromatic | \n", + "False | \n", + "False | \n", + ", France | \n", + "
3 | \n", + "Abbaye de Citeaux | \n", + "cow | \n", + "France | \n", + "Burgundy | \n", + "NaN | \n", + "semi-soft, artisan, brined | \n", + "creamy, dense, smooth | \n", + "washed | \n", + "white | \n", + "acidic, milky, smooth | \n", + "barnyardy, earthy | \n", + "False | \n", + "False | \n", + "Burgundy, France | \n", + "
4 | \n", + "Abbaye de Tamié | \n", + "cow | \n", + "France | \n", + "Savoie | \n", + "NaN | \n", + "soft, artisan | \n", + "creamy, open, smooth | \n", + "washed | \n", + "white | \n", + "fruity, nutty | \n", + "perfumed, pungent | \n", + "False | \n", + "False | \n", + "Savoie, France | \n", + "
... | \n", + "... | \n", + "... | \n", + "... | \n", + "... | \n", + "... | \n", + "... | \n", + "... | \n", + "... | \n", + "... | \n", + "... | \n", + "... | \n", + "... | \n", + "... | \n", + "... | \n", + "
1182 | \n", + "Sveciaost | \n", + "cow | \n", + "Sweden | \n", + "Low-laying regions | \n", + "NaN | \n", + "semi-hard, brined | \n", + "creamy, supple | \n", + "rindless | \n", + "pale yellow | \n", + "acidic | \n", + "NaN | \n", + "False | \n", + "False | \n", + "Low-laying regions, Sweden | \n", + "
1183 | \n", + "Swag | \n", + "goat | \n", + "Australia | \n", + "South Australia | \n", + "NaN | \n", + "fresh firm, artisan | \n", + "creamy, crumbly | \n", + "ash coated | \n", + "white | \n", + "acidic, creamy | \n", + "fresh | \n", + "True | \n", + "False | \n", + "South Australia, Australia | \n", + "
1184 | \n", + "Swaledale | \n", + "sheep | \n", + "England | \n", + "Swaledale, North Yorkshire | \n", + "NaN | \n", + "hard | \n", + "semi firm | \n", + "NaN | \n", + "yellow | \n", + "smooth, sweet | \n", + "floral | \n", + "True | \n", + "False | \n", + "Swaledale, North Yorkshire, England | \n", + "
1185 | \n", + "Sweet Style Swiss | \n", + "NaN | \n", + "Switzerland | \n", + "\n", + " | NaN | \n", + "semi-hard, artisan | \n", + "firm, supple | \n", + "waxed | \n", + "NaN | \n", + "nutty | \n", + "nutty, sweet | \n", + "False | \n", + "False | \n", + ", Switzerland | \n", + "
1186 | \n", + "Swiss cheese | \n", + "cow | \n", + "United States | \n", + "\n", + " | Swiss Cheese | \n", + "hard, artisan, processed | \n", + "firm | \n", + "rindless | \n", + "pale yellow | \n", + "nutty, sweet | \n", + "NaN | \n", + "True | \n", + "False | \n", + ", United States | \n", + "
1142 rows × 14 columns
\n", + "\n", - " | cheese | \n", - "url | \n", - "milk | \n", - "country | \n", - "region | \n", - "family | \n", - "type | \n", - "fat_content | \n", - "calcium_content | \n", - "texture | \n", - "rind | \n", - "color | \n", - "flavor | \n", - "aroma | \n", - "vegetarian | \n", - "vegan | \n", - "synonyms | \n", - "alt_spellings | \n", - "producers | \n", - "
---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
10 | \n", - "Acapella | \n", - "https://www.cheese.com/acapella/ | \n", - "goat | \n", - "United States | \n", - "California | \n", - "NaN | \n", - "soft, soft-ripened | \n", - "NaN | \n", - "NaN | \n", - "NaN | \n", - "NaN | \n", - "NaN | \n", - "buttery | \n", - "fresh, herbal | \n", - "False | \n", - "False | \n", - "NaN | \n", - "NaN | \n", - "NaN | \n", - "
13 | \n", - "Acorn | \n", - "https://www.cheese.com/acorn/ | \n", - "sheep | \n", - "United Kingdom | \n", - "Bethania | \n", - "NaN | \n", - "hard, artisan | \n", - "52% | \n", - "NaN | \n", - "crumbly, firm | \n", - "NaN | \n", - "NaN | \n", - "burnt caramel, citrusy, herbaceous | \n", - "fruity | \n", - "True | \n", - "False | \n", - "NaN | \n", - "NaN | \n", - "NaN | \n", - "
19 | \n", - "Afuega'l Pitu | \n", - "https://www.cheese.com/afuegal-pitu/ | \n", - "cow | \n", - "Spain | \n", - "Asturias | \n", - "NaN | \n", - "soft, artisan | \n", - "NaN | \n", - "NaN | \n", - "smooth | \n", - "cloth wrapped | \n", - "NaN | \n", - "spicy, strong | \n", - "NaN | \n", - "False | \n", - "False | \n", - "NaN | \n", - "NaN | \n", - "NaN | \n", - "
48 | \n", - "Alpe di Frabosa | \n", - "https://www.cheese.com/alpe-di-frabosa/ | \n", - "cow | \n", - "Italy | \n", - "NaN | \n", - "NaN | \n", - "semi-soft | \n", - "NaN | \n", - "NaN | \n", - "NaN | \n", - "NaN | \n", - "NaN | \n", - "bitter | \n", - "milky, mushroom | \n", - "False | \n", - "False | \n", - "NaN | \n", - "NaN | \n", - "NaN | \n", - "
50 | \n", - "Alpicrème | \n", - "https://www.cheese.com/alpicreme/ | \n", - "goat | \n", - "France | \n", - "NaN | \n", - "NaN | \n", - "soft | \n", - "NaN | \n", - "NaN | \n", - "NaN | \n", - "NaN | \n", - "NaN | \n", - "NaN | \n", - "NaN | \n", - "False | \n", - "False | \n", - "NaN | \n", - "NaN | \n", - "NaN | \n", - "
... | \n", - "... | \n", - "... | \n", - "... | \n", - "... | \n", - "... | \n", - "... | \n", - "... | \n", - "... | \n", - "... | \n", - "... | \n", - "... | \n", - "... | \n", - "... | \n", - "... | \n", - "... | \n", - "... | \n", - "... | \n", - "... | \n", - "... | \n", - "
1172 | \n", - "Strathdon Blue | \n", - "https://www.cheese.com/strathdon-blue/ | \n", - "cow | \n", - "Scotland | \n", - "Tain | \n", - "Blue | \n", - "semi-soft | \n", - "NaN | \n", - "NaN | \n", - "creamy | \n", - "NaN | \n", - "NaN | \n", - "creamy, spicy | \n", - "aromatic, rich | \n", - "True | \n", - "False | \n", - "NaN | \n", - "NaN | \n", - "Highland Fine Cheeses Limited | \n", - "
1175 | \n", - "String Cheese | \n", - "https://www.cheese.com/string/ | \n", - "NaN | \n", - "NaN | \n", - "NaN | \n", - "NaN | \n", - "semi-hard | \n", - "NaN | \n", - "NaN | \n", - "chewy, firm, stringy | \n", - "NaN | \n", - "NaN | \n", - "NaN | \n", - "NaN | \n", - "NaN | \n", - "NaN | \n", - "NaN | \n", - "NaN | \n", - "NaN | \n", - "
1177 | \n", - "Sulguni | \n", - "https://www.cheese.com/sulguni/ | \n", - "buffalo, cow | \n", - "Georgia | \n", - "Svaneti, Samegrelo | \n", - "NaN | \n", - "semi-firm | \n", - "NaN | \n", - "NaN | \n", - "dense, elastic | \n", - "NaN | \n", - "NaN | \n", - "salty, smokey , sour | \n", - "NaN | \n", - "NaN | \n", - "NaN | \n", - "Georgian Pickle Cheese | \n", - "Megruli Sulguni, Shebolili Megruli Sulguni | \n", - "NaN | \n", - "
1181 | \n", - "Sussex Slipcote | \n", - "https://www.cheese.com/sussex-slipcote/ | \n", - "sheep | \n", - "England | \n", - "NaN | \n", - "NaN | \n", - "soft | \n", - "NaN | \n", - "NaN | \n", - "NaN | \n", - "NaN | \n", - "NaN | \n", - "sharp | \n", - "NaN | \n", - "True | \n", - "False | \n", - "NaN | \n", - "NaN | \n", - "High Weald Dairy | \n", - "
1185 | \n", - "Sweet Style Swiss | \n", - "https://www.cheese.com/sweet-style-swiss/ | \n", - "NaN | \n", - "Switzerland | \n", - "NaN | \n", - "NaN | \n", - "semi-hard, artisan | \n", - "NaN | \n", - "NaN | \n", - "firm, supple | \n", - "waxed | \n", - "NaN | \n", - "nutty | \n", - "nutty, sweet | \n", - "False | \n", - "False | \n", - "NaN | \n", - "NaN | \n", - "NaN | \n", - "
142 rows × 19 columns
\n", - "1181 rows × 13 columns
\n", "" ], "text/plain": [ - " cheese milk country region \\\n", - "0 Aarewasser cow Switzerland NaN \n", - "1 Abbaye de Belloc sheep France Pays Basque \n", - "2 Abbaye de Belval cow France NaN \n", - "3 Abbaye de Citeaux cow France Burgundy \n", - "4 Abbaye de Tamié cow France Savoie \n", - "... ... ... ... ... \n", - "1182 Sveciaost cow Sweden Low-laying regions \n", - "1183 Swag goat Australia South Australia \n", - "1184 Swaledale sheep England Swaledale, North Yorkshire \n", - "1185 Sweet Style Swiss NaN Switzerland NaN \n", - "1186 Swiss cheese cow United States NaN \n", + " cheese milk \\\n", + "12 Ackawi cow, goat, sheep \n", + "116 Baladi cow, goat, sheep \n", + "160 Beemster 2% Milk cow \n", + "212 Blissful Blocks NaN \n", + "213 Blissful Toppings NaN \n", + "243 Bootlegger cow, sheep \n", + "262 Brebis d'Azure sheep \n", + "297 Brunost cow, goat \n", + "300 Bryndza sheep \n", + "311 Burrata water buffalo \n", + "316 Butterkase cow \n", + "367 Cap Cressy goat \n", + "375 Capri Blu goat \n", + "377 Caprice goat \n", + "407 Casu marzu sheep \n", + "437 Cheese Curds NaN \n", + "445 Chhurpi cow, yak \n", + "455 Chura Kampo yak \n", + "508 Cottage Cheese cow \n", + "512 Counting Sheep…and Goats... cow, goat, sheep \n", + "524 Cream Cheesy Bliss NaN \n", + "537 Cressy Blu cow \n", + "569 La Couronne - Fort Aged Comté cow \n", + "601 Lamb Chopper sheep \n", + "621 Le Conquerant Demi Pont L'eveque cow \n", + "646 Limburger cow \n", + "675 Lunetta cow \n", + "701 Mamirolle cow \n", + "776 Monastery Cheeses cow \n", + "789 Monterey Jack cow \n", + "852 Paneer cow, water buffalo \n", + "975 President Fat Free Feta cow \n", + "1001 Purple's a Must cow, goat \n", + "1082 Shanklish cow, sheep \n", + "1099 Shredded Bliss NaN \n", + "1106 Sirene cow, goat, sheep \n", + "1108 Slices Of Bliss NaN \n", + "1123 Sosha goat, yak \n", + "1173 Strawberry Moon cow \n", "\n", - " family type texture \\\n", - "0 NaN semi-soft buttery \n", - "1 NaN semi-hard, artisan creamy, dense, firm \n", - "2 NaN semi-hard elastic \n", - "3 NaN semi-soft, artisan, brined creamy, dense, smooth \n", - "4 NaN soft, artisan creamy, open, smooth \n", - "... ... ... ... \n", - "1182 NaN semi-hard, brined creamy, supple \n", - "1183 NaN fresh firm, artisan creamy, crumbly \n", - "1184 NaN hard semi firm \n", - "1185 NaN semi-hard, artisan firm, supple \n", - "1186 Swiss Cheese hard, artisan, processed firm \n", + " country \\\n", + "12 Cyprus, Egypt, Israel, Jordan, Lebanon, Middle... \n", + "116 Lebanon, Middle East \n", + "160 Canada, Denmark, France, Germany, Netherlands,... \n", + "212 Canada, United States \n", + "213 Canada, United States \n", + "243 Canada, Italy \n", + "262 Canada, Italy \n", + "297 Denmark, Finland, Germany, Iceland, Norway, Sw... \n", + "300 Hungary, Poland, Slovakia \n", + "311 Italy, United States \n", + "316 Austria, Germany \n", + "367 Canada, Italy \n", + "375 Canada, Italy \n", + "377 Canada, Italy \n", + "407 France, Italy \n", + "437 Canada, India, United States \n", + "445 China, Nepal, Tibet \n", + "455 China, Tibet \n", + "508 United Kingdom, United States \n", + "512 Canada, Italy \n", + "524 Canada, United States \n", + "537 Canada, Italy \n", + "569 France, Switzerland \n", + "601 Netherlands, United States \n", + "621 Australia, France \n", + "646 Belgium, Germany, Netherlands \n", + "675 Canada, Italy \n", + "701 Canada, France \n", + "776 Belgium, Canada, France, Switzerland, United S... \n", + "789 Mexico, United States \n", + "852 Bangladesh, India \n", + "975 France, United States \n", + "1001 Canada, Italy \n", + "1082 Egypt, Lebanon, Syria \n", + "1099 Canada, United States \n", + "1106 Albania, Bulgaria, Croatia, Greece, Israel, Ma... \n", + "1108 Canada, United States \n", + "1123 China, Nepal, Tibet \n", + "1173 Canada, Italy \n", "\n", - " rind color flavor aroma \\\n", - "0 washed yellow sweet buttery \n", - "1 natural yellow burnt caramel lanoline \n", - "2 washed ivory NaN aromatic \n", - "3 washed white acidic, milky, smooth barnyardy, earthy \n", - "4 washed white fruity, nutty perfumed, pungent \n", - "... ... ... ... ... \n", - "1182 rindless pale yellow acidic NaN \n", - "1183 ash coated white acidic, creamy fresh \n", - "1184 NaN yellow smooth, sweet floral \n", - "1185 waxed NaN nutty nutty, sweet \n", - "1186 rindless pale yellow nutty, sweet NaN \n", + " region family \\\n", + "12 + Feta \n", + "116 NaN \n", + "160 NaN \n", + "212 Cheddar \n", + "213 Parmesan \n", + "243 Lombardy NaN \n", + "262 Lombardy Blue \n", + "297 NaN \n", + "300 NaN \n", + "311 Apulia Mozzarella \n", + "316 NaN \n", + "367 Lombardy NaN \n", + "375 Lombardy Blue \n", + "377 Lombardy NaN \n", + "407 Sardinia (Italy), Southern Corsica (France) NaN \n", + "437 Cheddar \n", + "445 Cottage \n", + "455 Tibet NaN \n", + "508 Cottage \n", + "512 Lombardy NaN \n", + "524 NaN \n", + "537 Lombardy Blue \n", + "569 Franche Comté NaN \n", + "601 California Gouda \n", + "621 NaN \n", + "646 Duchy of Limburg NaN \n", + "675 Lombardy NaN \n", + "701 Plessisville, Quebec NaN \n", + "776 NaN \n", + "789 Monterey, California Monterey Jack \n", + "852 Cottage \n", + "975 New York Feta \n", + "1001 Lombardy Blue \n", + "1082 Feta \n", + "1099 Mozzarella \n", + "1106 Trakia Feta \n", + "1108 Cheddar \n", + "1123 Tibet NaN \n", + "1173 Lombardy NaN \n", "\n", - " vegetarian vegan \n", - "0 False False \n", - "1 True False \n", - "2 False False \n", - "3 False False \n", - "4 False False \n", - "... ... ... \n", - "1182 False False \n", - "1183 True False \n", - "1184 True False \n", - "1185 False False \n", - "1186 True False \n", + " type texture \\\n", + "12 soft, brined elastic, smooth, springy \n", + "116 fresh soft, artisan creamy, dense, smooth \n", + "160 semi-soft smooth \n", + "212 hard creamy, crumbly \n", + "213 soft crumbly \n", + "243 hard, artisan crumbly, firm \n", + "262 semi-hard, artisan, blue-veined soft \n", + "297 semi-soft, whey dense \n", + "300 soft, artisan spreadable \n", + "311 fresh soft, artisan creamy, stringy \n", + "316 semi-soft creamy, smooth, spreadable \n", + "367 semi-hard, artisan, smear-ripened compact, dense \n", + "375 soft, blue-veined creamy, soft \n", + "377 soft creamy, smooth \n", + "407 soft, soft-ripened soft-ripened \n", + "437 fresh firm firm, springy \n", + "445 soft, hard, artisan dense \n", + "455 hard, artisan dense, dry, firm \n", + "508 soft, artisan, processed creamy, crumbly \n", + "512 soft, soft-ripened creamy, soft \n", + "524 soft creamy, spreadable \n", + "537 semi-hard, blue-veined creamy, crumbly, firm \n", + "569 semi-hard dense \n", + "601 hard dense, firm, smooth \n", + "621 soft, artisan chalky, creamy, soft \n", + "646 semi-soft, smear-ripened crumbly, firm, smooth \n", + "675 fresh soft, artisan creamy \n", + "701 semi-soft, artisan chewy, supple \n", + "776 soft, semi-soft, brined chalky, creamy, firm, grainy \n", + "789 semi-hard compact, creamy, firm, open, supple \n", + "852 fresh firm crumbly, firm \n", + "975 firm, artisan, brined crumbly \n", + "1001 semi-hard, artisan, blue-veined creamy, crumbly \n", + "1082 fresh firm, hard, artisan creamy, crumbly, firm \n", + "1099 semi-soft elastic, smooth, springy, stringy \n", + "1106 fresh soft, brined crumbly, grainy, smooth \n", + "1108 soft creamy \n", + "1123 soft, artisan creamy \n", + "1173 semi-hard, artisan, smear-ripened compact, creamy, dense \n", "\n", - "[1181 rows x 13 columns]" + " rind color flavor \\\n", + "12 natural white mild, milky, salty \n", + "116 rindless white buttery, mild, salty, sweet \n", + "160 NaN NaN nutty \n", + "212 plastic yellow creamy, savory, sharp, spicy \n", + "213 artificial yellow savory, sharp \n", + "243 natural pale yellow fruity, full-flavored, strong \n", + "262 natural pale yellow sharp \n", + "297 natural brown caramel, sweet \n", + "300 rindless white mild, salty \n", + "311 leaf wrapped white buttery, milky \n", + "316 natural pale yellow buttery, mild \n", + "367 washed pale yellow mellow, savory, sweet \n", + "375 natural pale yellow creamy, subtle, sweet \n", + "377 natural white subtle \n", + "407 natural NaN NaN \n", + "437 natural white mild, milky \n", + "445 natural pale yellow tangy \n", + "455 natural NaN NaN \n", + "508 rindless white sweet \n", + "512 NaN white creamy, subtle, sweet \n", + "524 artificial white creamy, garlicky, herbaceous, sweet \n", + "537 natural pale yellow creamy, savory, sweet \n", + "569 NaN pale yellow caramel, nutty, sweet \n", + "601 waxed ivory buttery, caramel, creamy, nutty, sweet \n", + "621 washed NaN creamy, mild \n", + "646 washed straw grassy, mild, mushroomy \n", + "675 natural white creamy, salty \n", + "701 washed ivory buttery, fruity, salty, sweet \n", + "776 washed golden yellow mild, pungent \n", + "789 NaN pale yellow buttery, mild \n", + "852 rindless white milky \n", + "975 natural white herbaceous, salty, tangy \n", + "1001 mold ripened pale yellow full-flavored, strong \n", + "1082 mold ripened white sharp, spicy, strong \n", + "1099 plastic pale yellow mild, milky \n", + "1106 natural white lemony, salty, sharp, tangy \n", + "1108 plastic yellow creamy, savory, sharp, spicy \n", + "1123 natural white pungent, strong \n", + "1173 washed straw subtle, sweet \n", + "\n", + " aroma vegetarian vegan \n", + "12 mild, milky False False \n", + "116 fresh False False \n", + "160 aromatic, floral, fruity False False \n", + "212 NaN True False \n", + "213 NaN True False \n", + "243 floral NaN NaN \n", + "262 aromatic NaN NaN \n", + "297 NaN NaN NaN \n", + "300 NaN NaN NaN \n", + "311 fresh, milky False False \n", + "316 NaN False False \n", + "367 lactic NaN NaN \n", + "375 goaty NaN NaN \n", + "377 goaty NaN NaN \n", + "407 NaN NaN NaN \n", + "437 fresh NaN NaN \n", + "445 NaN NaN NaN \n", + "455 aromatic NaN NaN \n", + "508 NaN True False \n", + "512 nutty NaN NaN \n", + "524 rich True False \n", + "537 NaN NaN NaN \n", + "569 rich NaN NaN \n", + "601 mild, sweet True False \n", + "621 pungent NaN NaN \n", + "646 stinky False False \n", + "675 aromatic, fresh NaN NaN \n", + "701 earthy, pungent False False \n", + "776 pungent, strong False False \n", + "789 aromatic NaN NaN \n", + "852 fresh, milky True False \n", + "975 fresh NaN NaN \n", + "1001 rich NaN NaN \n", + "1082 pungent, strong False False \n", + "1099 fresh, mild True False \n", + "1106 strong False False \n", + "1108 NaN True False \n", + "1123 pungent, strong NaN NaN \n", + "1173 strong NaN NaN " ] }, - "execution_count": 10, + "execution_count": 51, "metadata": {}, "output_type": "execute_result" } ], "source": [ - "data=data.dropna(subset=[\"country\",\"region\"], how=\"all\")\n", - "data" + "print(len(data[data[\"country\"].str.contains(\",\")]))\n", + "data[data[\"country\"].str.contains(\",\")]\n" ] }, { "cell_type": "code", - "execution_count": null, - "id": "e28eb2ee-1bed-4dd7-8133-c99b1f7ea26b", + "execution_count": 52, + "id": "43058589-f931-46ad-99a7-44be63f962cc", "metadata": {}, "outputs": [], - "source": [] + "source": [ + "data=data.drop(index=data[data[\"country\"].str.contains(\",\")].index)" + ] }, { - "cell_type": "code", - "execution_count": 11, - "id": "5a4c0e30-8535-498b-9a9e-0d7d232d4eb7", + "cell_type": "markdown", + "id": "2f42c973-247a-4f51-947e-fbd76f8f12fc", "metadata": {}, - "outputs": [ - { - "name": "stderr", - "output_type": "stream", - "text": [ - "/tmp/ipykernel_39592/2649664722.py:2: SettingWithCopyWarning: \n", - "A value is trying to be set on a copy of a slice from a DataFrame.\n", - "Try using .loc[row_indexer,col_indexer] = value instead\n", - "\n", - "See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy\n", - " data[\"country\"]=data[\"country\"].fillna(\"\")\n", - "/tmp/ipykernel_39592/2649664722.py:3: SettingWithCopyWarning: \n", - "A value is trying to be set on a copy of a slice from a DataFrame.\n", - "Try using .loc[row_indexer,col_indexer] = value instead\n", - "\n", - "See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy\n", - " data[\"region\"]=data[\"region\"].fillna(\"\")\n" - ] - } - ], "source": [ - "data[[\"country\",\"region\"]]\n", - "data[\"country\"]=data[\"country\"].fillna(\"\")\n", - "data[\"region\"]=data[\"region\"].fillna(\"\")" + "We removed 39 cheeses because they can come froms several countries. " ] }, { "cell_type": "code", - "execution_count": 35, - "id": "0edcee6f-a2c3-4804-a665-507b77f2651b", + "execution_count": 53, + "id": "59c4e6e7-d624-45a5-a9ea-eb375102b771", "metadata": {}, - "outputs": [ - { - "name": "stderr", - "output_type": "stream", - "text": [ - "/tmp/ipykernel_39592/3582726305.py:1: SettingWithCopyWarning: \n", - "A value is trying to be set on a copy of a slice from a DataFrame.\n", - "Try using .loc[row_indexer,col_indexer] = value instead\n", - "\n", - "See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy\n", - " data[\"location\"]=data[\"region\"]+\", \"+data[\"country\"]\n" - ] - } - ], + "outputs": [], "source": [ "data[\"location\"]=data[\"region\"]+\", \"+data[\"country\"]" ] }, { "cell_type": "code", - "execution_count": 36, - "id": "017e30da-4f60-4d16-b6d4-56fb76acb740", + "execution_count": 54, + "id": "0dee0f25-4699-4e46-97d0-21bb36d9c603", "metadata": {}, "outputs": [ { @@ -2190,7 +2417,7 @@ " \n", " \n", "\n", - "1181 rows × 14 columns
\n", + "1142 rows × 14 columns
\n", "" ], "text/plain": [ @@ -2246,10 +2473,10 @@ "1185 False False , Switzerland \n", "1186 True False , United States \n", "\n", - "[1181 rows x 14 columns]" + "[1142 rows x 14 columns]" ] }, - "execution_count": 36, + "execution_count": 54, "metadata": {}, "output_type": "execute_result" } @@ -2260,530 +2487,545 @@ }, { "cell_type": "code", - "execution_count": 37, - "id": "bf9d5b2a-bd47-4c4c-85c4-5ad7769a3f31", - "metadata": {}, - "outputs": [ - { - "data": { - "text/plain": [ - "430" - ] - }, - "execution_count": 37, - "metadata": {}, - "output_type": "execute_result" - } - ], - "source": [ - "len(set(data[\"location\"]))" - ] - }, - { - "cell_type": "code", - "execution_count": 44, - "id": "e7ae8f76-b33b-42ce-9dea-9fab9e33069e", + "execution_count": null, + "id": "2ef7351c-f117-403b-bc6e-f9f30a98c9d2", "metadata": {}, "outputs": [], - "source": [ - "locs=list(set(loc for loc in data[\"location\"]))" - ] + "source": [] }, { "cell_type": "code", - "execution_count": 49, - "id": "fb044984-c33c-492c-91a2-4e9fff29ceb3", + "execution_count": null, + "id": "353724eb-8d64-4b64-84c6-f06be36acd8b", + "metadata": {}, + "outputs": [], + "source": [] + }, + { + "cell_type": "code", + "execution_count": null, + "id": "54d56bd4-c83a-4e8c-8751-b4b2f7830a9e", + "metadata": {}, + "outputs": [], + "source": [] + }, + { + "cell_type": "code", + "execution_count": null, + "id": "bd68f1bb-c9f6-4c57-951b-8ac1f3192f09", + "metadata": {}, + "outputs": [], + "source": [] + }, + { + "cell_type": "code", + "execution_count": null, + "id": "eeff487e-9b66-4c4b-b4f6-dc5352fb2144", + "metadata": {}, + "outputs": [], + "source": [] + }, + { + "cell_type": "code", + "execution_count": null, + "id": "cdb0d04c-e0f2-4553-8906-e9282f4942d2", + "metadata": {}, + "outputs": [], + "source": [] + }, + { + "cell_type": "code", + "execution_count": null, + "id": "a551e0f4-3f99-4dae-9b31-6205b772ebf5", + "metadata": {}, + "outputs": [], + "source": [] + }, + { + "cell_type": "code", + "execution_count": null, + "id": "7c02cc29-fe07-4ff9-8c6b-8638d37830cd", + "metadata": {}, + "outputs": [], + "source": [] + }, + { + "cell_type": "code", + "execution_count": null, + "id": "de579631-a29c-4620-9bbf-7085b83d16b7", + "metadata": {}, + "outputs": [], + "source": [] + }, + { + "cell_type": "code", + "execution_count": 55, + "id": "e2e868d4-33a1-4602-af97-afb1d29e612f", "metadata": {}, "outputs": [ { "data": { "text/plain": [ - "['Oristano, Italy',\n", - " 'Isere, France',\n", - " 'Romanian Carpathians, Romania',\n", - " 'French Basque Country, Midi-Pyrénées, France',\n", - " 'Kilmallock County Limerick, Ireland',\n", - " ', Australia',\n", - " 'massif des Causses, France',\n", - " 'Basque, Pyrenees Mountains, France',\n", - " 'Modena, Italy',\n", - " 'Vermont, United States',\n", - " 'Rhone-Alps, France',\n", - " 'Brooklyn NY, United States',\n", - " 'Coast of Oregon, United States',\n", - " 'Veneto, Trentino, Italy',\n", - " 'Emilia Romagna, Italy',\n", - " ', Middle East',\n", - " 'Carmarthenshire, Wales',\n", - " ', Egypt, Lebanon, Syria',\n", - " 'Jura, Switzerland',\n", - " ', Australia, France',\n", - " 'Rio Grande do Sul, Brazil',\n", - " ', Turkey',\n", - " 'Banks Peninsular in Canterbury, New Zealand',\n", - " 'Loire Valley, France',\n", - " 'Berry, France',\n", - " 'Seattle, Washington, United States',\n", - " 'Marathon, NY, United States',\n", - " 'Setubal, Palmela and Sesimbra, Portugal',\n", - " 'Central Balkan Mountains, Bulgaria',\n", - " 'North Wootton, England',\n", - " 'Allagau, Bavarian Alps, Germany',\n", - " 'Colorado, United States',\n", - " ', Armenia',\n", - " 'Lebanon, CT, United States',\n", - " 'Centre-Val de Loire, France',\n", - " 'Barcelona, Spain',\n", - " 'South West England, England',\n", - " 'Laqueuille, France',\n", - " 'Fethard, Co Tipperary, Ireland',\n", - " 'Mornington Peninsula, Melbourne, Australia',\n", - " 'Odell, Bedfordshire, England, Great Britain, United Kingdom',\n", - " 'Shelburne Farms, United States',\n", - " ', Israel',\n", - " 'South Australia, Australia',\n", - " 'Bornholm, Denmark',\n", - " 'Pyrénées, France',\n", - " 'Sardinia & Campania, Italy',\n", - " 'Hunter Valley, Australia',\n", - " 'Greenville, Indiana, United States',\n", - " 'Pokolbin, Hunter Valley, Australia',\n", - " 'Landford, England, Great Britain, United Kingdom',\n", - " 'Carrigtwohill, Ireland',\n", - " 'Minnesota, United States',\n", - " 'Lombardy, Italy',\n", - " 'County Cavan, Ireland',\n", + "{', Afghanistan',\n", " ', Argentina',\n", - " ', France',\n", - " 'Avila, Spain',\n", - " 'Crotone, Italy',\n", - " 'New Hampshire, United States',\n", - " ', Serbia',\n", - " 'Lombardy, Canada, Italy',\n", - " 'Pays d’Auge, Normandy, France',\n", - " 'Wisconsin, United States',\n", - " 'Tomales, California, United States',\n", - " ', Netherlands',\n", - " 'Serra da Estrela, Portugal',\n", - " 'St. Gallen (canton), Tufertschwil, Switzerland',\n", - " 'Extremadura, Spain',\n", - " ', Spain',\n", - " 'Pesaro-Urbino, Italy',\n", - " 'New York, France, United States',\n", - " 'Northern Holland, Netherlands',\n", - " 'South West England, United Kingdom',\n", - " 'Mankato, MN, United States',\n", - " 'Charentes-Poitou, France',\n", - " 'Postel, Belgium',\n", - " 'Auvergne, Salers, France',\n", - " 'Leiden, Netherlands',\n", - " 'Apulia, Italy, United States',\n", - " ', Afghanistan',\n", - " 'Canary Islands, Spain',\n", - " ', Great Britain, United Kingdom, Wales',\n", - " 'Oregon Coast Range, United States',\n", - " 'Calabria, Italy',\n", - " 'Utah, United States',\n", - " 'Gâtinais, France',\n", - " 'North Yorkshire, England',\n", - " 'Carnia, Italy',\n", - " 'Passendale, Belgium',\n", - " \"Lucerne, Schwyz, Unterwald, and Zoug, and the following additional places: Muri district in d'Argovi, Switzerland\",\n", - " 'Carrigtwohill, ',\n", - " 'Adamstown, Co Wexford, Ireland',\n", - " 'Bermondsey, London, England, Great Britain, United Kingdom',\n", - " 'Lapland, Finland',\n", - " 'Tasmania, Australia',\n", - " 'Staffordshire, England, Great Britain, United Kingdom',\n", - " 'Ile de France, France',\n", - " 'Lodi, Italy',\n", - " 'Macedonia, Thrace, Thessalia, Peloponissos, Ionian Islands, Aegean islands, Crete Island and Epirus, Greece',\n", - " ', United Kingdom, United States',\n", - " 'Southern California, United States',\n", - " 'South West England, England, United Kingdom',\n", - " 'Haute Vienne, France',\n", - " 'Menorca, Balearic Islands, Spain',\n", - " 'Aberdeenshire, Scotland',\n", - " 'Kimball, United States',\n", - " 'Schoonrewoerd, Leerdam, Netherlands',\n", - " 'Friuli-Venezia Giulia, Italy',\n", - " 'Larzac, France',\n", - " 'Nottinghamshire, England, Great Britain, United Kingdom',\n", - " 'Charm, Ohio, United States',\n", - " 'Troyes , Aube, France',\n", - " ', Denmark, Finland, Germany, Iceland, Norway, Sweden',\n", - " 'Québec, Canada',\n", - " 'Herault, France',\n", - " 'Pullman, Washington, United States',\n", - " 'Dumfries, Scotland',\n", - " 'Tieton, Washington, United States',\n", - " 'Murazzano, Italy',\n", - " 'Pennsylvania, United States',\n", - " 'Co. Carlow, Ireland',\n", - " 'Languedoc-Roussillon, France',\n", - " 'Aquitaine, France',\n", - " 'Franche Comté, France, Switzerland',\n", - " 'Duhallow, Ireland',\n", - " 'Gippsland, Victoria, Australia',\n", - " 'British Columbia, Canada',\n", - " ', Austria, Germany',\n", - " 'Hamilton, New Zealand',\n", - " 'Roncq, France',\n", - " 'St. Louis, Missouri, United States',\n", - " 'Iowa, United States',\n", - " 'Burgund, France',\n", - " 'Pembrokeshire, Great Britain, United Kingdom, Wales',\n", - " 'Ballarat, Victoria, Australia',\n", - " 'Nord-Pas-de-Calais, France',\n", - " 'Aconcagua, Chile',\n", - " 'Massachusetts, United States',\n", - " 'North Yorkshire, England, Great Britain, United Kingdom',\n", - " 'Bregenzerwald, Kleinwalsertal, Großwalsertal, Laiblachtal (Pfänderstock) and Rheintal, Austria',\n", - " ', Denmark',\n", - " 'Ile-de-France/Champagne, France',\n", - " 'Castilla Leon, Spain',\n", - " 'Asiago, Italy',\n", - " 'Manitoba, Canada',\n", - " 'Cheshire, England, Great Britain, United Kingdom',\n", - " 'County Tipperary, Clogheen, Ireland',\n", - " 'Valpadana, Italy',\n", - " 'Severn Valley, England, Great Britain, United Kingdom',\n", - " 'Co Clare, Ireland',\n", - " 'Timsbury, Somerset, England, Great Britain, United Kingdom',\n", - " 'Somerset, England, Great Britain, United Kingdom',\n", - " 'Greensboro, VT, United States',\n", - " 'Dorset, England, Great Britain, United Kingdom',\n", - " 'Orkney Islands, Great Britain, Scotland, United Kingdom',\n", - " 'East Midlands, England',\n", - " 'Northeastern Brazil, Brazil',\n", - " 'NY, United States',\n", - " ', England, Great Britain, United Kingdom',\n", - " 'Alba, Italy',\n", - " 'Fife, Scotland',\n", - " 'Stranraer, England, Scotland, United Kingdom',\n", - " 'Castelo Branco, Fundão and Idanha-a-Nova, Portugal',\n", - " 'Moliterno, Italy',\n", - " 'Dorset, England',\n", - " 'Cornwall, England, Great Britain, United Kingdom',\n", - " 'Northwest, United States',\n", - " 'Carneros, Sonoma, California, United States',\n", - " 'Croisy-sur-Eure, France',\n", - " 'Pyrenees-Atlantiques, France',\n", - " 'Västra Götaland, Sweden',\n", - " 'Brisbane, Australia',\n", - " 'Campania, Paestum, Foggia, Italy',\n", - " 'Cevenes, France',\n", - " ', England',\n", - " 'Corsica, France',\n", + " ', Armenia',\n", + " ', Australia',\n", " ', Austria',\n", - " 'Ann Arbor, Michigan, United States',\n", - " 'Po valley region, Italy',\n", - " 'Banon, France',\n", - " 'Herefordshire, West Midlands, United Kingdom',\n", - " 'Zasavica, Serbia',\n", - " ', United Kingdom, Wales',\n", - " 'Lower Normandy, France',\n", - " 'Piave Valley, Italy, Italy',\n", - " 'Nicasio, United States',\n", - " 'Beara Peninsula, Co. Cork, Ireland',\n", - " 'Cotswolds, England, Great Britain, United Kingdom',\n", - " 'Missouri, United States',\n", - " 'Rhone Valley, France',\n", - " 'California, United States',\n", - " 'Oxfordshire, Great Britain',\n", - " 'Petaluma, California, United States',\n", - " 'Prince Edward Island, Canada',\n", - " 'North Cornwall, England',\n", - " 'Coquet, England',\n", - " 'Emilia-Romagna, Italy',\n", - " 'Castille-Leon, Spain',\n", - " ', Cyprus',\n", - " 'Bethania, United Kingdom',\n", - " 'Puimichel in Provence Alpes, France',\n", - " 'Gloucestershire County, England, United Kingdom',\n", - " 'Galicia, Spain',\n", - " 'Flanders, Belgium',\n", - " ', Canada, Denmark, France, Germany, Netherlands, United States',\n", - " 'Lanarkshire, Great Britain, Scotland, United Kingdom',\n", - " 'Pays Basque, France',\n", - " 'Veneto, Italy',\n", - " ', Scotland',\n", - " 'Victoria, Australia',\n", - " 'Co Limerick, Ireland',\n", - " 'Treviso, Veneto, Italy',\n", - " 'Wales, Great Britain',\n", - " 'Serra da Canastra, Minas Gerais state, Brazil',\n", - " 'Devon, England, United Kingdom',\n", - " 'Gevrey-Chambertin, Burgundy, France',\n", - " ', Brazil',\n", - " 'Gloucestershire, England, Great Britain, United Kingdom',\n", - " 'Averyon, France',\n", - " 'Midi-Pyrénées, France',\n", - " 'Tipperary, Ireland',\n", - " 'Maribo, Denmark',\n", - " 'province of Brittany, France',\n", - " 'Bavaria, Germany',\n", - " ', United States',\n", - " 'Northern Wisconsin, United States',\n", - " 'New York, United States',\n", - " 'Blarney, Ireland',\n", - " 'Stewarton, Scotland, United Kingdom',\n", - " 'Monterey, California, United States',\n", - " 'Wigtownshire, Scotland',\n", - " 'Cornwall, England',\n", - " 'Co. Offaly, Ireland',\n", - " 'Karlovy Vary, Czech Republic',\n", - " 'Quebec, Canada',\n", - " 'Laruns, France',\n", - " 'Maine, United States',\n", - " ', Mauritania',\n", - " 'Piemonte, Italy',\n", - " 'Brittany, France',\n", - " 'Poitou-Charentes, France',\n", - " 'Swaledale, North Yorkshire, England',\n", - " 'Timsbury, Somerset, England, Scotland, Wales',\n", - " ', Iceland',\n", - " 'Oviken, Sweden',\n", - " 'Pyrénées-Atlantiques, France',\n", - " 'Pinconning, Michigan, United States',\n", - " 'Belvederis, Lithuania',\n", - " 'Chelmarsh, Bridgnorth, Shropshire, England',\n", - " 'Peekskill, United States',\n", - " 'Ceredigion, United Kingdom',\n", - " 'All Holland, Netherlands',\n", - " 'Normandy, France',\n", - " 'Inagh, Co Clare, ',\n", - " 'Amou, Gascony, France',\n", - " 'Colby, Wisconsin, United States',\n", - " 'Southwestern Wisconsin, United States',\n", - " 'Lincolnshire, England, United Kingdom',\n", - " 'Bas-Languedoc, Comtat Venaissin, France',\n", - " ', United Kingdom',\n", - " ', Switzerland',\n", - " ', Portugal',\n", - " 'Comox Valley, Vancouver Island, Canada',\n", - " 'Derbyshire, Leicestershire, Nottinghamshire, England',\n", - " 'Huizen, Netherlands',\n", - " 'Asturias, Spain',\n", - " 'Piedmont, Italy',\n", - " ', Canada, India, United States',\n", - " 'County Antrim, Ireland',\n", - " ', Italy',\n", - " 'St Antoine, France',\n", - " ', Hungary',\n", - " 'County Carlow, Ireland',\n", - " 'Provencale, France',\n", - " ', Sweden',\n", - " 'Allgau, Germany',\n", - " 'North Carolina, United States',\n", - " 'Basilicata, Italy',\n", - " ', Canada',\n", - " 'Beira Baixa Province, Portugal',\n", - " 'Ann Arbor, MI, United States',\n", - " ', China, Nepal, Tibet',\n", - " 'Bursa, Turkey',\n", - " 'Websterville, VT, United States',\n", - " 'Kent, United Kingdom',\n", - " 'County Wexford, Ireland',\n", - " 'island wide, Cyprus',\n", - " 'Pyrenees, France',\n", - " ', Mexico',\n", - " 'Duchy of Limburg, Belgium, Germany, Netherlands',\n", - " 'Cotherstone, England, United Kingdom',\n", - " 'Richfield, Wisconsin, United States',\n", - " 'Pienza, Italy',\n", - " 'Dalmatia, Croatia',\n", - " 'Taxco, Mexico',\n", - " 'Plessisville, Quebec, Canada, France',\n", - " ', Lebanon, Middle East',\n", - " 'Mols, Denmark',\n", - " '+, Cyprus, Egypt, Israel, Jordan, Lebanon, Middle East, Syria',\n", - " 'Prince Edward County, Ontario, Canada',\n", " ', Belgium',\n", - " 'Auvergne, France',\n", - " ', Canada, United States',\n", - " 'Upper Corsica, France',\n", - " 'New South Wales, Australia',\n", - " 'Tibet, China, Nepal, Tibet',\n", - " 'West Bengal, India',\n", - " ', Iraq',\n", - " 'Béarnaise in Pyrénées-Atlantique, France',\n", - " 'Co. Cork, Ireland',\n", - " 'Vorarlberg, Austria',\n", - " 'Midi-Pyrenees, France',\n", - " ', Ireland',\n", - " 'Wallonia, Belgium',\n", - " 'Devon, England',\n", - " 'South East England, United Kingdom',\n", - " 'Indiana, United States',\n", - " 'Island of Pag, Croatia',\n", - " 'Sonoma, California, United States',\n", - " 'Port Townsend, United States',\n", - " 'old Liburnia (Dalmatia), Croatia',\n", - " ', Mexico and Caribbean',\n", - " 'North Yorkshire, England, United Kingdom',\n", - " 'Charentes, France',\n", - " 'La Velle, Wisconsin, United States',\n", + " ', Brazil',\n", + " ', Canada',\n", + " ', Cyprus',\n", + " ', Denmark',\n", + " ', England',\n", + " ', France',\n", " ', Germany',\n", - " 'Monterey, California, Mexico, United States',\n", - " 'Roxburghshire, Scotland, United Kingdom',\n", - " 'Minas Gerais, Brazil',\n", - " 'Sardinia (Italy), Southern Corsica (France), France, Italy',\n", - " ', Hungary, Poland, Slovakia',\n", - " 'Allgaeu Alps, Germany',\n", - " 'Orkney Isles, Scotland, United Kingdom',\n", - " 'East Sussex, United Kingdom',\n", - " 'Póvoa de Lanhoso, Portugal',\n", - " 'Central and Western Macedonia, Thessalia, Greece',\n", - " 'Friuli Venezia Giulia and Veneto, Italy',\n", - " 'Somerset, England, United Kingdom',\n", - " 'Brickhill, Co. Clare, Ireland',\n", - " 'New York, France',\n", - " 'Burgundy, France',\n", - " ', Holland',\n", - " 'Gujarat, India',\n", - " 'Pembrokeshire, United Kingdom',\n", - " 'Milford, NJ, United States',\n", - " 'Campania, Italy',\n", - " ', Mongolia',\n", - " 'Valencia, Spain',\n", - " 'Tibet, China, Tibet',\n", - " 'Bourgogne, France',\n", - " 'Bjurholm, Sweden',\n", - " 'Het Groene Hart, Netherlands',\n", - " 'Kinfauns, Perthshire, Scotland',\n", - " 'Stoneyford, Ireland',\n", - " 'West Pawlet, VT, United States',\n", - " 'Sebastopol, California, United States',\n", - " 'Airedale farming district, New Zealand',\n", - " 'Wales, London, United Kingdom, Wales',\n", - " 'Tain, Scotland',\n", - " 'Naples, Italy',\n", - " 'Chirac, France',\n", - " 'Fornells de la Selva, Gironès, Spain',\n", - " 'Canton of Glarus, Switzerland',\n", - " ', Belgium, Canada, France, Switzerland, United States',\n", - " 'Tuscany, Italy',\n", - " 'Haute-Savoie / Upper Savoy, France',\n", - " 'Cornwall, ',\n", - " 'Centre , the department of Loiret, France',\n", - " ', Poland',\n", - " 'Rhône-Alpes, France',\n", - " 'Trakia, Albania, Bulgaria, Croatia, Greece, Israel, Macedonia, Romania, Serbia',\n", - " 'Somerset, England',\n", - " 'North East Victoria, Australia',\n", - " 'Sardegna, Italy',\n", - " 'Fairview, United States',\n", - " 'Murcia, Spain',\n", - " 'Languedoc, France',\n", - " 'Veneto, ',\n", - " 'Umbria, Lazio, Italy',\n", - " 'Sulzberg, Austria',\n", - " 'Queenstown, New Zealand',\n", - " 'Bergues, France',\n", - " 'Piora Valley, Switzerland',\n", - " 'Savoie, France',\n", - " 'Galax, Virginia, United States',\n", - " ', New Zealand',\n", - " 'Devon, England, Great Britain, United Kingdom',\n", - " 'Avesnes, France',\n", - " 'Dumfriesshire, Scotland, United Kingdom',\n", " ', Greece',\n", - " 'Franche Comté, France',\n", - " 'Ontario, Canada',\n", - " 'North East Victoria, ',\n", - " 'Oregon, United States',\n", - " 'Loire, France',\n", - " 'Friuli-Venezia Giulia and the Veneto, Italy',\n", - " 'Virginia, United States',\n", - " 'Central and Western Macedonia, Thessaly, Greece',\n", - " 'Co. Mayo, Ireland',\n", - " 'Normandy, Auvilliers, France',\n", - " 'Bloomdale, United States',\n", - " 'Azores, Portugal',\n", - " 'Georgia, United States',\n", - " 'Swabia, Germany',\n", - " 'Äänekoski, Finland',\n", - " 'Lazio, Sardinia, Italy',\n", - " 'Buxton, Derbyshire, England, United Kingdom',\n", - " 'Inagh, Co Clare, Ireland',\n", - " 'Landshut, Germany',\n", - " 'East Midlands, England, Great Britain, United Kingdom',\n", - " 'East Midlands, England, United Kingdom',\n", - " 'Stawley, near Wellington, Somerset, England, Great Britain, United Kingdom',\n", - " 'Allgäu, Germany',\n", - " ', Bangladesh, India',\n", - " 'Stonegate, East Sussex, England, Great Britain, United Kingdom',\n", - " 'Castile-Leon, Spain',\n", - " 'New Jersey, United States',\n", - " 'Svaneti, Samegrelo, Georgia',\n", - " 'Low-laying regions, Sweden',\n", - " 'California, Netherlands, United States',\n", - " 'Gravina in Puglia, Murgia, Italy',\n", - " 'Aveyron, Laguiole, France',\n", - " 'Provence, France',\n", - " 'Illoud (Haute-Marne), France',\n", - " 'Cumbrian, United Kingdom',\n", + " ', Holland',\n", + " ', Hungary',\n", + " ', Iceland',\n", + " ', Iraq',\n", + " ', Ireland',\n", + " ', Israel',\n", + " ', Italy',\n", + " ', Mauritania',\n", + " ', Mexico',\n", + " ', Mexico and Caribbean',\n", + " ', Middle East',\n", + " ', Mongolia',\n", + " ', Netherlands',\n", + " ', New Zealand',\n", + " ', Poland',\n", + " ', Portugal',\n", + " ', Scotland',\n", + " ', Serbia',\n", + " ', Spain',\n", + " ', Sweden',\n", + " ', Switzerland',\n", + " ', Turkey',\n", + " ', United Kingdom',\n", + " ', United States',\n", " ', Wales',\n", - " 'Illinois, United States',\n", + " 'Aberdeenshire, Scotland',\n", + " 'Aconcagua, Chile',\n", + " 'Adamstown, Co Wexford, Ireland',\n", + " 'Airedale farming district, New Zealand',\n", + " 'Alba, Italy',\n", + " 'All Holland, Netherlands',\n", + " 'Allagau, Bavarian Alps, Germany',\n", + " 'Allgaeu Alps, Germany',\n", + " 'Allgau, Germany',\n", + " 'Allgäu, Germany',\n", + " 'Amou, Gascony, France',\n", + " 'Anjou, France',\n", + " 'Ann Arbor, MI, United States',\n", + " 'Ann Arbor, Michigan, United States',\n", + " 'Aquitaine, France',\n", + " 'Asiago, Italy',\n", + " 'Asturias, Spain',\n", + " 'Auvergne, France',\n", + " 'Auvergne, Salers, France',\n", + " 'Averyon, France',\n", + " 'Avesnes, France',\n", " 'Aveyron, France',\n", - " 'Anjou, France']" + " 'Aveyron, Laguiole, France',\n", + " 'Avila, Spain',\n", + " 'Azores, Portugal',\n", + " 'Ballarat, Victoria, Australia',\n", + " 'Banks Peninsular in Canterbury, New Zealand',\n", + " 'Banon, France',\n", + " 'Barcelona, Spain',\n", + " 'Bas-Languedoc, Comtat Venaissin, France',\n", + " 'Basilicata, Italy',\n", + " 'Basque, Pyrenees Mountains, France',\n", + " 'Bavaria, Germany',\n", + " 'Beara Peninsula, Co. Cork, Ireland',\n", + " 'Beira Baixa Province, Portugal',\n", + " 'Belvederis, Lithuania',\n", + " 'Bergues, France',\n", + " 'Bermondsey, London, England',\n", + " 'Berry, France',\n", + " 'Bethania, United Kingdom',\n", + " 'Bjurholm, Sweden',\n", + " 'Blarney, Ireland',\n", + " 'Bloomdale, United States',\n", + " 'Bornholm, Denmark',\n", + " 'Bourgogne, France',\n", + " 'Bregenzerwald, Kleinwalsertal, Großwalsertal, Laiblachtal (Pfänderstock) and Rheintal, Austria',\n", + " 'Brickhill, Co. Clare, Ireland',\n", + " 'Brisbane, Australia',\n", + " 'British Columbia, Canada',\n", + " 'Brittany, France',\n", + " 'Brooklyn NY, United States',\n", + " 'Burgund, France',\n", + " 'Burgundy, France',\n", + " 'Bursa, Turkey',\n", + " 'Buxton, Derbyshire, England',\n", + " 'Béarnaise in Pyrénées-Atlantique, France',\n", + " 'Calabria, Italy',\n", + " 'California, United States',\n", + " 'Campania, Italy',\n", + " 'Campania, Paestum, Foggia, Italy',\n", + " 'Canary Islands, Spain',\n", + " 'Canton of Glarus, Switzerland',\n", + " 'Carmarthenshire, Wales',\n", + " 'Carneros, Sonoma, California, United States',\n", + " 'Carnia, Italy',\n", + " 'Carrigtwohill, ',\n", + " 'Carrigtwohill, Ireland',\n", + " 'Castelo Branco, Fundão and Idanha-a-Nova, Portugal',\n", + " 'Castile-Leon, Spain',\n", + " 'Castilla Leon, Spain',\n", + " 'Castille-Leon, Spain',\n", + " 'Central Balkan Mountains, Bulgaria',\n", + " 'Central and Western Macedonia, Thessalia, Greece',\n", + " 'Central and Western Macedonia, Thessaly, Greece',\n", + " 'Centre , the department of Loiret, France',\n", + " 'Centre-Val de Loire, France',\n", + " 'Ceredigion, United Kingdom',\n", + " 'Cevenes, France',\n", + " 'Charentes, France',\n", + " 'Charentes-Poitou, France',\n", + " 'Charm, Ohio, United States',\n", + " 'Chelmarsh, Bridgnorth, Shropshire, England',\n", + " 'Cheshire, England',\n", + " 'Chirac, France',\n", + " 'Co Clare, Ireland',\n", + " 'Co Limerick, Ireland',\n", + " 'Co. Carlow, Ireland',\n", + " 'Co. Cork, Ireland',\n", + " 'Co. Mayo, Ireland',\n", + " 'Co. Offaly, Ireland',\n", + " 'Coast of Oregon, United States',\n", + " 'Colby, Wisconsin, United States',\n", + " 'Colorado, United States',\n", + " 'Comox Valley, Vancouver Island, Canada',\n", + " 'Coquet, England',\n", + " 'Cornwall, ',\n", + " 'Cornwall, England',\n", + " 'Corsica, France',\n", + " 'Cotherstone, England',\n", + " 'Cotswolds, England',\n", + " 'County Antrim, Ireland',\n", + " 'County Carlow, Ireland',\n", + " 'County Cavan, Ireland',\n", + " 'County Tipperary, Clogheen, Ireland',\n", + " 'County Wexford, Ireland',\n", + " 'Croisy-sur-Eure, France',\n", + " 'Crotone, Italy',\n", + " 'Cumbrian, United Kingdom',\n", + " 'Dalmatia, Croatia',\n", + " 'Derbyshire, Leicestershire, Nottinghamshire, England',\n", + " 'Devon, England',\n", + " 'Dorset, England',\n", + " 'Duhallow, Ireland',\n", + " 'Dumfries, Scotland',\n", + " 'Dumfriesshire, Scotland',\n", + " 'East Midlands, England',\n", + " 'East Sussex, United Kingdom',\n", + " 'Emilia Romagna, Italy',\n", + " 'Emilia-Romagna, Italy',\n", + " 'Extremadura, Spain',\n", + " 'Fairview, United States',\n", + " 'Fethard, Co Tipperary, Ireland',\n", + " 'Fife, Scotland',\n", + " 'Flanders, Belgium',\n", + " 'Fornells de la Selva, Gironès, Spain',\n", + " 'Franche Comté, France',\n", + " 'French Basque Country, Midi-Pyrénées, France',\n", + " 'Friuli Venezia Giulia and Veneto, Italy',\n", + " 'Friuli-Venezia Giulia and the Veneto, Italy',\n", + " 'Friuli-Venezia Giulia, Italy',\n", + " 'Galax, Virginia, United States',\n", + " 'Galicia, Spain',\n", + " 'Georgia, United States',\n", + " 'Gevrey-Chambertin, Burgundy, France',\n", + " 'Gippsland, Victoria, Australia',\n", + " 'Gloucestershire County, England',\n", + " 'Gloucestershire, England',\n", + " 'Gravina in Puglia, Murgia, Italy',\n", + " 'Greensboro, VT, United States',\n", + " 'Greenville, Indiana, United States',\n", + " 'Gujarat, India',\n", + " 'Gâtinais, France',\n", + " 'Hamilton, New Zealand',\n", + " 'Haute Vienne, France',\n", + " 'Haute-Savoie / Upper Savoy, France',\n", + " 'Herault, France',\n", + " 'Herefordshire, West Midlands, United Kingdom',\n", + " 'Het Groene Hart, Netherlands',\n", + " 'Huizen, Netherlands',\n", + " 'Hunter Valley, Australia',\n", + " 'Ile de France, France',\n", + " 'Ile-de-France/Champagne, France',\n", + " 'Illinois, United States',\n", + " 'Illoud (Haute-Marne), France',\n", + " 'Inagh, Co Clare, ',\n", + " 'Inagh, Co Clare, Ireland',\n", + " 'Indiana, United States',\n", + " 'Iowa, United States',\n", + " 'Isere, France',\n", + " 'Island of Pag, Croatia',\n", + " 'Jura, Switzerland',\n", + " 'Karlovy Vary, Czech Republic',\n", + " 'Kent, United Kingdom',\n", + " 'Kilmallock County Limerick, Ireland',\n", + " 'Kimball, United States',\n", + " 'Kinfauns, Perthshire, Scotland',\n", + " 'La Velle, Wisconsin, United States',\n", + " 'Lanarkshire, Scotland',\n", + " 'Landford, England',\n", + " 'Landshut, Germany',\n", + " 'Languedoc, France',\n", + " 'Languedoc-Roussillon, France',\n", + " 'Lapland, Finland',\n", + " 'Laqueuille, France',\n", + " 'Laruns, France',\n", + " 'Larzac, France',\n", + " 'Lazio, Sardinia, Italy',\n", + " 'Lebanon, CT, United States',\n", + " 'Leiden, Netherlands',\n", + " 'Lincolnshire, England',\n", + " 'Lodi, Italy',\n", + " 'Loire Valley, France',\n", + " 'Loire, France',\n", + " 'Lombardy, Italy',\n", + " 'Low-laying regions, Sweden',\n", + " 'Lower Normandy, France',\n", + " \"Lucerne, Schwyz, Unterwald, and Zoug, and the following additional places: Muri district in d'Argovi, Switzerland\",\n", + " 'Macedonia, Thrace, Thessalia, Peloponissos, Ionian Islands, Aegean islands, Crete Island and Epirus, Greece',\n", + " 'Maine, United States',\n", + " 'Manitoba, Canada',\n", + " 'Mankato, MN, United States',\n", + " 'Marathon, NY, United States',\n", + " 'Maribo, Denmark',\n", + " 'Massachusetts, United States',\n", + " 'Menorca, Balearic Islands, Spain',\n", + " 'Midi-Pyrenees, France',\n", + " 'Midi-Pyrénées, France',\n", + " 'Milford, NJ, United States',\n", + " 'Minas Gerais, Brazil',\n", + " 'Minnesota, United States',\n", + " 'Missouri, United States',\n", + " 'Modena, Italy',\n", + " 'Moliterno, Italy',\n", + " 'Mols, Denmark',\n", + " 'Monterey, California, United States',\n", + " 'Mornington Peninsula, Melbourne, Australia',\n", + " 'Murazzano, Italy',\n", + " 'Murcia, Spain',\n", + " 'NY, United States',\n", + " 'Naples, Italy',\n", + " 'New Hampshire, United States',\n", + " 'New Jersey, United States',\n", + " 'New South Wales, Australia',\n", + " 'New York, France',\n", + " 'New York, United States',\n", + " 'Nicasio, United States',\n", + " 'Nord-Pas-de-Calais, France',\n", + " 'Normandy, Auvilliers, France',\n", + " 'Normandy, France',\n", + " 'North Carolina, United States',\n", + " 'North Cornwall, England',\n", + " 'North East Victoria, ',\n", + " 'North East Victoria, Australia',\n", + " 'North Wootton, England',\n", + " 'North Yorkshire, England',\n", + " 'Northeastern Brazil, Brazil',\n", + " 'Northern Holland, Netherlands',\n", + " 'Northern Wisconsin, United States',\n", + " 'Northwest, United States',\n", + " 'Nottinghamshire, England',\n", + " 'Odell, Bedfordshire, England',\n", + " 'Ontario, Canada',\n", + " 'Oregon Coast Range, United States',\n", + " 'Oregon, United States',\n", + " 'Oristano, Italy',\n", + " 'Orkney Islands, Scotland',\n", + " 'Orkney Isles, Scotland',\n", + " 'Oviken, Sweden',\n", + " 'Oxfordshire, Great Britain',\n", + " 'Passendale, Belgium',\n", + " 'Pays Basque, France',\n", + " 'Pays d’Auge, Normandy, France',\n", + " 'Peekskill, United States',\n", + " 'Pembrokeshire, United Kingdom',\n", + " 'Pembrokeshire, Wales',\n", + " 'Pennsylvania, United States',\n", + " 'Pesaro-Urbino, Italy',\n", + " 'Petaluma, California, United States',\n", + " 'Piave Valley, Italy, Italy',\n", + " 'Piedmont, Italy',\n", + " 'Piemonte, Italy',\n", + " 'Pienza, Italy',\n", + " 'Pinconning, Michigan, United States',\n", + " 'Piora Valley, Switzerland',\n", + " 'Po valley region, Italy',\n", + " 'Poitou-Charentes, France',\n", + " 'Pokolbin, Hunter Valley, Australia',\n", + " 'Port Townsend, United States',\n", + " 'Postel, Belgium',\n", + " 'Prince Edward County, Ontario, Canada',\n", + " 'Prince Edward Island, Canada',\n", + " 'Provencale, France',\n", + " 'Provence, France',\n", + " 'Puimichel in Provence Alpes, France',\n", + " 'Pullman, Washington, United States',\n", + " 'Pyrenees, France',\n", + " 'Pyrenees-Atlantiques, France',\n", + " 'Pyrénées, France',\n", + " 'Pyrénées-Atlantiques, France',\n", + " 'Póvoa de Lanhoso, Portugal',\n", + " 'Quebec, Canada',\n", + " 'Queenstown, New Zealand',\n", + " 'Québec, Canada',\n", + " 'Rhone Valley, France',\n", + " 'Rhone-Alps, France',\n", + " 'Rhône-Alpes, France',\n", + " 'Richfield, Wisconsin, United States',\n", + " 'Rio Grande do Sul, Brazil',\n", + " 'Romanian Carpathians, Romania',\n", + " 'Roncq, France',\n", + " 'Roxburghshire, Scotland',\n", + " 'Sardegna, Italy',\n", + " 'Sardinia & Campania, Italy',\n", + " 'Savoie, France',\n", + " 'Schoonrewoerd, Leerdam, Netherlands',\n", + " 'Seattle, Washington, United States',\n", + " 'Sebastopol, California, United States',\n", + " 'Serra da Canastra, Minas Gerais state, Brazil',\n", + " 'Serra da Estrela, Portugal',\n", + " 'Setubal, Palmela and Sesimbra, Portugal',\n", + " 'Severn Valley, England',\n", + " 'Shelburne Farms, United States',\n", + " 'Somerset, England',\n", + " 'Sonoma, California, United States',\n", + " 'South Australia, Australia',\n", + " 'South East England, United Kingdom',\n", + " 'South West England, England',\n", + " 'South West England, United Kingdom',\n", + " 'Southern California, United States',\n", + " 'Southwestern Wisconsin, United States',\n", + " 'St Antoine, France',\n", + " 'St. Gallen (canton), Tufertschwil, Switzerland',\n", + " 'St. Louis, Missouri, United States',\n", + " 'Staffordshire, England',\n", + " 'Stawley, near Wellington, Somerset, England',\n", + " 'Stewarton, Scotland',\n", + " 'Stonegate, East Sussex, England',\n", + " 'Stoneyford, Ireland',\n", + " 'Stranraer, Scotland',\n", + " 'Sulzberg, Austria',\n", + " 'Svaneti, Samegrelo, Georgia',\n", + " 'Swabia, Germany',\n", + " 'Swaledale, North Yorkshire, England',\n", + " 'Tain, Scotland',\n", + " 'Tasmania, Australia',\n", + " 'Taxco, Mexico',\n", + " 'Tieton, Washington, United States',\n", + " 'Timsbury, Somerset, England',\n", + " 'Timsbury, Somerset, Scotland',\n", + " 'Tipperary, Ireland',\n", + " 'Tomales, California, United States',\n", + " 'Treviso, Veneto, Italy',\n", + " 'Troyes , Aube, France',\n", + " 'Tuscany, Italy',\n", + " 'Umbria, Lazio, Italy',\n", + " 'Upper Corsica, France',\n", + " 'Utah, United States',\n", + " 'Valencia, Spain',\n", + " 'Valpadana, Italy',\n", + " 'Veneto, ',\n", + " 'Veneto, Italy',\n", + " 'Veneto, Trentino, Italy',\n", + " 'Vermont, United States',\n", + " 'Victoria, Australia',\n", + " 'Virginia, United States',\n", + " 'Vorarlberg, Austria',\n", + " 'Västra Götaland, Sweden',\n", + " 'Wales, Great Britain',\n", + " 'Wales, London, Wales',\n", + " 'Wallonia, Belgium',\n", + " 'Websterville, VT, United States',\n", + " 'West Bengal, India',\n", + " 'West Pawlet, VT, United States',\n", + " 'Wigtownshire, Scotland',\n", + " 'Wisconsin, United States',\n", + " 'Zasavica, Serbia',\n", + " 'island wide, Cyprus',\n", + " 'massif des Causses, France',\n", + " 'old Liburnia (Dalmatia), Croatia',\n", + " 'province of Brittany, France',\n", + " 'Äänekoski, Finland'}" ] }, - "execution_count": 49, + "execution_count": 55, "metadata": {}, "output_type": "execute_result" } ], "source": [ + "locs=set(data[\"location\"])\n", "locs" ] }, { "cell_type": "code", - "execution_count": 40, - "id": "debb780e-ec13-4502-ac44-6001335e507d", + "execution_count": null, + "id": "f3bb9a47-56fa-49c4-8761-0db015944446", "metadata": {}, "outputs": [], - "source": [ - "from geopy.geocoders import Nominatim" - ] - }, - { - "cell_type": "code", - "execution_count": 41, - "id": "eed3ac7b-5283-4d8e-bc26-61e1d821ccaf", - "metadata": {}, - "outputs": [], - "source": [ - "geolocator=Nominatim(user_agent=\"toto\")" - ] - }, - { - "cell_type": "code", - "execution_count": 48, - "id": "0043fe0d-e2d2-48f0-8953-ffc3dee52ba6", - "metadata": {}, - "outputs": [], - "source": [ - "location=geolocator.geocode(locs[1])" - ] + "source": [] }, { "cell_type": "code", "execution_count": null, + "id": "debb780e-ec13-4502-ac44-6001335e507d", + "metadata": {}, + "outputs": [], + "source": [] + }, + { + "cell_type": "code", + "execution_count": null, + "id": "eed3ac7b-5283-4d8e-bc26-61e1d821ccaf", + "metadata": {}, + "outputs": [], + "source": [] + }, + { + "cell_type": "code", + "execution_count": 69, + "id": "0043fe0d-e2d2-48f0-8953-ffc3dee52ba6", + "metadata": {}, + "outputs": [], + "source": [ + "def str_to_gps(loc):\n", + " l=loc.split(\",\")\n", + " loc=\",\".join([l[0],l[-1]])# removing details gives less errors while fetching the GPS coordinates\n", + " try:\n", + " res=Nominatim(user_agent=\"dmProject\").geocode(loc) \n", + " return (res.latitude, res.longitude)\n", + " except AttributeError:\n", + " loc=l[-1]\n", + " res=Nominatim(user_agent=\"dmProject\").geocode(loc) \n", + " return (res.latitude, res.longitude)" + ] + }, + { + "cell_type": "code", + "execution_count": 70, "id": "710341db-408f-4a4a-a849-65b963582ebc", "metadata": {}, "outputs": [ { "data": { "application/vnd.jupyter.widget-view+json": { - "model_id": "a2bbdb40ac6c43b0bfe08d014970db40", + "model_id": "b78765c7ef7a4fad8cb4520512a198c8", "version_major": 2, "version_minor": 0 }, "text/plain": [ - " 0%| | 0/430 [00:00, ?it/s]" + " 0%| | 0/390 [00:00, ?it/s]" ] }, "metadata": {}, @@ -2793,195 +3035,563 @@ "name": "stdout", "output_type": "stream", "text": [ - "Oristano, Italy\n", - "Isere, France\n", - "Romanian Carpathians, Romania\n", - "French Basque Country, Midi-Pyrénées, France\n", - "ERREUR\n", - "Kilmallock County Limerick, Ireland\n", - ", Australia\n", - "massif des Causses, France\n", - "ERREUR\n", - "Basque, Pyrenees Mountains, France\n", - "ERREUR\n", - "Modena, Italy\n", - "Vermont, United States\n", - "Rhone-Alps, France\n", - "Brooklyn NY, United States\n", - "Coast of Oregon, United States\n", - "ERREUR\n", - "Veneto, Trentino, Italy\n", - "ERREUR\n", - "Emilia Romagna, Italy\n", - ", Middle East\n", - "Carmarthenshire, Wales\n", - ", Egypt, Lebanon, Syria\n", - "ERREUR\n", - "Jura, Switzerland\n", - ", Australia, France\n", - "Rio Grande do Sul, Brazil\n", - ", Turkey\n", - "Banks Peninsular in Canterbury, New Zealand\n", - "ERREUR\n", - "Loire Valley, France\n", - "Berry, France\n", - "Seattle, Washington, United States\n", - "Marathon, NY, United States\n", - "Setubal, Palmela and Sesimbra, Portugal\n", - "ERREUR\n", - "Central Balkan Mountains, Bulgaria\n", - "ERREUR\n", - "North Wootton, England\n", - "Allagau, Bavarian Alps, Germany\n", - "ERREUR\n", - "Colorado, United States\n", - ", Armenia\n", - "Lebanon, CT, United States\n", - "Centre-Val de Loire, France\n", - "Barcelona, Spain\n", - "South West England, England\n", - "Laqueuille, France\n", - "Fethard, Co Tipperary, Ireland\n", - "Mornington Peninsula, Melbourne, Australia\n", - "Odell, Bedfordshire, England, Great Britain, United Kingdom\n", - "ERREUR\n", - "Shelburne Farms, United States\n", - ", Israel\n", - "South Australia, Australia\n", - "Bornholm, Denmark\n", - "Pyrénées, France\n", - "Sardinia & Campania, Italy\n", - "ERREUR\n", - "Hunter Valley, Australia\n", - "Greenville, Indiana, United States\n", - "Pokolbin, Hunter Valley, Australia\n", - "ERREUR\n", - "Landford, England, Great Britain, United Kingdom\n", - "ERREUR\n", - "Carrigtwohill, Ireland\n", - "Minnesota, United States\n", - "Lombardy, Italy\n", - "County Cavan, Ireland\n", - ", Argentina\n", - ", France\n", - "Avila, Spain\n", - "Crotone, Italy\n", - "New Hampshire, United States\n", - ", Serbia\n", - "Lombardy, Canada, Italy\n", - "ERREUR\n", - "Pays d’Auge, Normandy, France\n", - "Wisconsin, United States\n", - "Tomales, California, United States\n", - ", Netherlands\n", - "Serra da Estrela, Portugal\n", - "St. Gallen (canton), Tufertschwil, Switzerland\n", - "ERREUR\n", - "Extremadura, Spain\n", - ", Spain\n", - "Pesaro-Urbino, Italy\n", - "New York, France, United States\n", - "ERREUR\n", - "Northern Holland, Netherlands\n", - "ERREUR\n", - "South West England, United Kingdom\n", - "Mankato, MN, United States\n", - "Charentes-Poitou, France\n", - "Postel, Belgium\n", - "Auvergne, Salers, France\n", - "Leiden, Netherlands\n", - "Apulia, Italy, United States\n", - "ERREUR\n", - ", Afghanistan\n", - "Canary Islands, Spain\n", - ", Great Britain, United Kingdom, Wales\n", - "ERREUR\n", - "Oregon Coast Range, United States\n", - "ERREUR\n", - "Calabria, Italy\n", - "Utah, United States\n", - "Gâtinais, France\n", - "North Yorkshire, England\n", - "Carnia, Italy\n", - "Passendale, Belgium\n", - "Lucerne, Schwyz, Unterwald, and Zoug, and the following additional places: Muri district in d'Argovi, Switzerland\n", - "ERREUR\n", - "Carrigtwohill, \n", - "Adamstown, Co Wexford, Ireland\n", - "Bermondsey, London, England, Great Britain, United Kingdom\n", - "ERREUR\n", - "Lapland, Finland\n", - "Tasmania, Australia\n", - "Staffordshire, England, Great Britain, United Kingdom\n", - "ERREUR\n", - "Ile de France, France\n", - "Lodi, Italy\n", - "Macedonia, Thrace, Thessalia, Peloponissos, Ionian Islands, Aegean islands, Crete Island and Epirus, Greece\n", - "ERREUR\n", - ", United Kingdom, United States\n", - "Southern California, United States\n", - "South West England, England, United Kingdom\n", - "Haute Vienne, France\n", - "Menorca, Balearic Islands, Spain\n", - "Aberdeenshire, Scotland\n", - "Kimball, United States\n", - "Schoonrewoerd, Leerdam, Netherlands\n", - "ERREUR\n", - "Friuli-Venezia Giulia, Italy\n", - "Larzac, France\n", - "Nottinghamshire, England, Great Britain, United Kingdom\n", - "ERREUR\n", - "Charm, Ohio, United States\n", - "Troyes , Aube, France\n", - ", Denmark, Finland, Germany, Iceland, Norway, Sweden\n", - "ERREUR\n", - "Québec, Canada\n", - "Herault, France\n", - "Pullman, Washington, United States\n" + "Valencia, Spain (39.4697065, -0.3763353)\n", + "Crotone, Italy (39.1873894, 16.87828188895307)\n", + "New Hampshire, United States (43.4849133, -71.6553992)\n", + "Setubal, Palmela and Sesimbra, Portugal (38.5241783, -8.8932341)\n", + ", Turkey (39.294076, 35.2316631)\n", + "Wisconsin, United States (44.4308975, -89.6884637)\n", + "Maine, United States (45.709097, -68.8590201)\n", + "Beara Peninsula, Co. Cork, Ireland (51.7280451, -9.767906428362338)\n", + "Castilla Leon, Spain (40.4598868, -3.4720773)\n", + ", Wales (52.2928116, -3.73893)\n", + "Romanian Carpathians, Romania (46.4046483, 22.9894841933513)\n", + "Pembrokeshire, Wales (51.8339209, -4.916667)\n", + "Lodi, Italy (45.2613104, 9.491678060021837)\n", + "Stoneyford, Ireland (52.5362671, -7.2278963)\n", + "Central and Western Macedonia, Thessaly, Greece (38.9953683, 21.9877132)\n", + ", Armenia (4.536307, -75.6723751)\n", + "Indiana, United States (40.3270127, -86.1746933)\n", + "Alba, Italy (44.7007236, 8.0357786)\n", + "East Sussex, United Kingdom (50.9404266, 0.3699977891068864)\n", + "Fornells de la Selva, Gironès, Spain (41.9319675, 2.8090343)\n", + ", Iraq (33.0955793, 44.1749775)\n", + "Treviso, Veneto, Italy (45.806691349999994, 12.206315763116372)\n", + ", Brazil (-10.3333333, -53.2)\n", + "North Wootton, England (52.7923213, 0.4278194)\n", + "Modena, Italy (44.5384728, 10.935960870530739)\n", + "Minas Gerais, Brazil (-18.5264844, -44.1588654)\n", + "Emilia-Romagna, Italy (44.525696, 11.039437)\n", + "Centre-Val de Loire, France (47.5490251, 1.7324062)\n", + "Dumfriesshire, Scotland (55.166667, -3.5)\n", + "Brisbane, Australia (-27.4689682, 153.0234991)\n", + "Carrigtwohill, (51.9094617, -8.2611809)\n", + "Azores, Portugal (37.80855645, -25.473137391245295)\n", + ", Austria (47.59397, 14.12456)\n", + "Basque, Pyrenees Mountains, France (45.359277750000004, -1.1480053453043046)\n", + "North East Victoria, (54.699881, -1.6031519)\n", + "Greensboro, VT, United States (36.0726355, -79.7919754)\n", + "Stawley, near Wellington, Somerset, England (50.9961449, -3.3382702)\n", + "Central and Western Macedonia, Thessalia, Greece (38.9953683, 21.9877132)\n", + "Po valley region, Italy (42.6384261, 12.674297)\n", + "Southwestern Wisconsin, United States (42.53116075, -90.43762550236468)\n", + "County Wexford, Ireland (52.46018745, -6.606515459159162)\n", + "Valpadana, Italy (39.60288591417616, 16.626802703803317)\n", + "Lapland, Finland (67.69291045, 26.728214183162986)\n", + ", United States (39.7837304, -100.445882)\n", + "Passendale, Belgium (50.9003015, 3.0203891)\n", + "Dorset, England (50.79683685, -2.34473226124306)\n", + "Chirac, France (45.9140138, 0.6548543)\n", + "North Carolina, United States (35.6729639, -79.0392919)\n", + "Umbria, Lazio, Italy (42.965916, 12.490236)\n", + "Iowa, United States (41.9216734, -93.3122705)\n", + "Inagh, Co Clare, (52.9071704, -9.2345138)\n", + "Roxburghshire, Scotland (56.7861112, -4.1140518)\n", + "Sardegna, Italy (40.0912813, 9.0305773)\n", + "province of Brittany, France (46.603354, 1.8883335)\n", + "Troyes , Aube, France (48.2971626, 4.0746257)\n", + "Carneros, Sonoma, California, United States (33.223027, -111.70568456233669)\n", + "Svaneti, Samegrelo, Georgia (42.63545205, 42.24871384619953)\n", + "La Velle, Wisconsin, United States (45.1699553, -109.88428658948227)\n", + "Georgia, United States (32.3293809, -83.1137366)\n", + "Brickhill, Co. Clare, Ireland (52.70642975, -8.751786760846851)\n", + "Sulzberg, Austria (47.52121792021591, 9.91273065974192)\n", + "Nicasio, United States (38.0615885, -122.6985975)\n", + "Inagh, Co Clare, Ireland (52.9071704, -9.2345138)\n", + "Burgundy, France (47.27808725, 4.222486304306048)\n", + "Aveyron, Laguiole, France (44.315857449999996, 2.5065697302419823)\n", + "Centre , the department of Loiret, France (47.5490251, 1.7324062)\n", + "Rhone Valley, France (46.603354, 1.8883335)\n", + "Tasmania, Australia (-42.035067, 146.6366887)\n", + "South West England, United Kingdom (51.0339991, -2.949011916021195)\n", + ", Canada (61.0666922, -107.991707)\n", + "Loire Valley, France (47.44927715, -0.34954901296919916)\n", + "Extremadura, Spain (39.1748426, -6.1529891)\n", + "New Jersey, United States (40.0757384, -74.4041622)\n", + "Nord-Pas-de-Calais, France (50.5289634, 2.454515765955904)\n", + "Piave Valley, Italy, Italy (45.735099578237005, 7.320173335891282)\n", + "Friuli-Venezia Giulia and the Veneto, Italy (42.6384261, 12.674297)\n", + "Co. Cork, Ireland (51.917535900000004, -8.58597726870895)\n", + "North Yorkshire, England (54.13453275, -1.498628491239545)\n", + "Illinois, United States (40.0796606, -89.4337288)\n", + "Gâtinais, France (48.15497515, 2.811419156673292)\n", + "Campania, Paestum, Foggia, Italy (40.860672, 14.843984)\n", + "Port Townsend, United States (48.1179702, -122.769544)\n", + "Piemonte, Italy (45.060735, 7.923549)\n", + "Bregenzerwald, Kleinwalsertal, Großwalsertal, Laiblachtal (Pfänderstock) and Rheintal, Austria (47.387028799999996, 9.95606355528393)\n", + "Brooklyn NY, United States (40.6526006, -73.9497211)\n", + "Avesnes, France (50.5495906, 1.9721295)\n", + "Petaluma, California, United States (38.2325829, -122.636465)\n", + "Lanarkshire, Scotland (55.5752966, -3.833333)\n", + "Co Clare, Ireland (52.857257450000006, -8.937435925994537)\n", + "Mankato, MN, United States (44.1634663, -93.9993505)\n", + "Friuli Venezia Giulia and Veneto, Italy (42.6384261, 12.674297)\n", + "Québec, Canada (52.4760892, -71.8258668)\n", + "Airedale farming district, New Zealand (-41.5000831, 172.8344077)\n", + "Galicia, Spain (42.61946, -7.863112)\n", + "Campania, Italy (40.860672, 14.843984)\n", + "Asiago, Italy (45.8753771, 11.5106998)\n", + "Monterey, California, United States (36.2231079, -121.387742)\n", + "Pullman, Washington, United States (46.7304268, -117.173895)\n", + "Devon, England (50.724140500000004, -3.6607788161410735)\n", + "Pesaro-Urbino, Italy (43.694112700000005, 12.701443660480004)\n", + "Ballarat, Victoria, Australia (-37.5623013, 143.8605645)\n", + "Savoie, France (45.494895150000005, 6.384660381375652)\n", + "Hunter Valley, Australia (-32.5421803, 151.2185641)\n", + "Auvergne, Salers, France (45.2968119, 4.6604809)\n", + "Chelmarsh, Bridgnorth, Shropshire, England (52.4875359, -2.4124407)\n", + "Duhallow, Ireland (52.1837912, -9.00609563330653)\n", + ", Serbia (44.024322850000004, 21.07657433209902)\n", + "Stranraer, Scotland (54.9044332, -5.026204)\n", + "Cotswolds, England (51.74894260792542, -0.23033349985221635)\n", + "Manitoba, Canada (55.001251, -97.001038)\n", + "South West England, England (51.50076785, -2.5503106339491204)\n", + "Berry, France (44.5760186, 0.3095833)\n", + "Co Limerick, Ireland (52.518831649999996, -8.795834650292788)\n", + "Averyon, France (46.603354, 1.8883335)\n", + "Co. Mayo, Ireland (53.9087056, -9.298304863654256)\n", + "Corsica, France (42.188089649999995, 9.068413771427695)\n", + "Moliterno, Italy (40.2423024, 15.868903)\n", + "Castelo Branco, Fundão and Idanha-a-Nova, Portugal (39.97675825, -7.446059929966704)\n", + "Oristano, Italy (40.02656765, 8.679641647435716)\n", + "Postel, Belgium (51.2874865, 5.1897863)\n", + ", Iceland (64.9841821, -18.1059013)\n", + "Brittany, France (48.2640845, -2.9202408)\n", + "Rio Grande do Sul, Brazil (-29.8425284, -53.7680577)\n", + "Greenville, Indiana, United States (34.851354, -82.3984882)\n", + "Macedonia, Thrace, Thessalia, Peloponissos, Ionian Islands, Aegean islands, Crete Island and Epirus, Greece (40.6186482, 22.91795361795959)\n", + "Shelburne Farms, United States (34.89046225, -82.24340593189123)\n", + "Provencale, France (43.7899311033635, 7.524017533510311)\n", + "Oxfordshire, Great Britain (51.7412674, -1.2245951)\n", + "Swabia, Germany (48.15313125, 10.47129100603846)\n", + "Comox Valley, Vancouver Island, Canada (49.670981, -125.0353253)\n", + "Dalmatia, Croatia (43.538796500000004, 16.175235566874342)\n", + "Murcia, Spain (37.9923795, -1.1305431)\n", + "Puimichel in Provence Alpes, France (46.603354, 1.8883335)\n", + "Peekskill, United States (41.289811, -73.9204922)\n", + "Menorca, Balearic Islands, Spain (39.949257200000005, 4.0499641751186415)\n", + "New South Wales, Australia (-31.8759835, 147.2869493)\n", + "Colorado, United States (38.7251776, -105.607716)\n", + "Piora Valley, Switzerland (46.7985624, 8.2319736)\n", + "Loire, France (45.75385355, 4.045473682551104)\n", + "Tieton, Washington, United States (46.7020686, -120.75535)\n", + "Oviken, Sweden (62.9974877, 14.3928671)\n", + "Taxco, Mexico (18.5565446, -99.6052838)\n", + "Rhône-Alpes, France (45.3175313, 5.721294352585611)\n", + ", Mexico and Caribbean ERROR\n", + "Bursa, Turkey (39.9895878, 28.8944669)\n", + "Nottinghamshire, England (53.1459288, -1.0214971168122484)\n", + "Karlovy Vary, Czech Republic (50.2306216, 12.8701437)\n", + "County Cavan, Ireland (54.03497495, -7.2937022825583675)\n", + "Northwest, United States (34.3129464, -78.1611077)\n", + ", Germany (51.1638175, 10.4478313)\n", + ", Sweden (59.6749712, 14.5208584)\n", + ", Argentina (-34.9964963, -64.9672817)\n", + "Queenstown, New Zealand (-45.0321923, 168.661)\n", + "All Holland, Netherlands (52.4601118, 4.6056526)\n", + "Flanders, Belgium (51.096246199999996, 4.178629103169916)\n", + "West Pawlet, VT, United States (43.356893, -73.24966776033015)\n", + "Bjurholm, Sweden (63.966667, 19.0)\n", + "Allgaeu Alps, Germany (51.1638175, 10.4478313)\n", + "Somerset, England (51.161750850000004, -3.0753867062227487)\n", + "Herefordshire, West Midlands, United Kingdom (52.083333, -2.75)\n", + "Västra Götaland, Sweden (58.215850200000006, 12.651820794914073)\n", + ", Scotland (56.7861112, -4.1140518)\n", + "Provence, France (44.0580563, 6.0638506)\n", + "Mornington Peninsula, Melbourne, Australia (-38.3312575, 145.08106868543985)\n", + "Haute-Savoie / Upper Savoy, France (46.06904065, 6.344532137164)\n", + ", Middle East (39.3014159, -76.5888477)\n", + "Sonoma, California, United States (38.5110803, -122.8473388)\n", + "Veneto, Italy (45.6476663, 11.8665254)\n", + "Haute Vienne, France (45.91901925, 1.203176771876291)\n", + "Gloucestershire County, England (51.9425914, -2.100154122305389)\n", + "Massachusetts, United States (42.3788774, -72.032366)\n", + "Carmarthenshire, Wales (51.893669849999995, -4.217282721429928)\n", + "Orkney Isles, Scotland (56.7861112, -4.1140518)\n", + ", Belgium (50.6402809, 4.6667145)\n", + "Lombardy, Italy (45.5703694, 9.7732524)\n", + "Oregon, United States (43.9792797, -120.737257)\n", + "Cheshire, England (53.2141028, -2.471770086071205)\n", + "Blarney, Ireland (51.9325233, -8.5678665)\n", + "Timsbury, Somerset, England (51.3271927, -2.4755923)\n", + "Veneto, Trentino, Italy (45.6476663, 11.8665254)\n", + "Co. Offaly, Ireland (53.13617215, -7.810340751784169)\n", + "Barcelona, Spain (41.3828939, 2.1774322)\n", + "Sardinia & Campania, Italy (42.6384261, 12.674297)\n", + "West Bengal, India (22.9964948, 87.6855882)\n", + "Banon, France (44.0381752, 5.6296701)\n", + "Laruns, France (42.9882368, -0.4266324)\n", + "Gevrey-Chambertin, Burgundy, France (47.2261857, 4.9705666)\n", + "Pyrenees, France (48.8738565, 2.3852638)\n", + "Murazzano, Italy (44.4746494, 8.0213361)\n", + "Southern California, United States (34.169262950000004, -116.787448181486)\n", + "Normandy, France (49.0677708, 0.3138532)\n", + "Charentes, France (45.4039367, 0.3756199)\n", + "island wide, Cyprus (34.9174159, 32.889902651331866)\n", + "Larzac, France (44.74693, 1.0075)\n", + "Pays d’Auge, Normandy, France (49.0356178, 0.1573083324015645)\n", + "Pyrenees-Atlantiques, France (43.18718655, -0.728247400084667)\n", + "Auvergne, France (45.2968119, 4.6604809)\n", + "Burgund, France (47.27808725, 4.222486304306048)\n", + ", Portugal (39.6621648, -8.1353519)\n", + "Jura, Switzerland (47.3566699, 7.1598893)\n", + "Emilia Romagna, Italy (44.525696, 11.039437)\n", + "East Midlands, England (53.1188177, -1.2597068974971675)\n", + "Missouri, United States (38.7604815, -92.5617875)\n", + "Marathon, NY, United States (44.8914036, -89.7748098)\n", + ", Holland (52.2434979, 5.6343227)\n", + "Ann Arbor, MI, United States (42.2813722, -83.7484616)\n", + "Cevenes, France (44.3509309, 3.8584812791602983)\n", + "Bergues, France (50.9683886, 2.4325247)\n", + "Pokolbin, Hunter Valley, Australia (-32.7792106, 151.2978747)\n", + "Pyrénées, France (48.8738565, 2.3852638)\n", + ", Netherlands (52.2434979, 5.6343227)\n", + "Gippsland, Victoria, Australia (-37.87448275, 146.9111788341666)\n", + "Cumbrian, United Kingdom (54.478530449999994, -3.06553306667584)\n", + "Friuli-Venezia Giulia, Italy (46.151042, 13.055904)\n", + "Kilmallock County Limerick, Ireland (52.400645600000004, -8.571161660434711)\n", + "Gloucestershire, England (51.7643786, -2.1880661838719386)\n", + "Vermont, United States (44.5990718, -72.5002608)\n", + "Stewarton, Scotland (55.680265, -4.5153023)\n", + "Leiden, Netherlands (52.1594747, 4.4908843)\n", + "Lebanon, CT, United States (40.375713, -76.4626118)\n", + "Tomales, California, United States (38.2468075, -122.90630461024097)\n", + "Bermondsey, London, England (51.4970125, -0.063268)\n", + "Tipperary, Ireland (52.4734839, -8.1614446)\n", + "Fife, Scotland (56.3333331, -3.0000001)\n", + "Allgäu, Germany (47.5926009, 10.209156)\n", + ", France (46.603354, 1.8883335)\n", + "French Basque Country, Midi-Pyrénées, France (46.603354, 1.8883335)\n", + "Severn Valley, England (52.454530899999995, -2.3755702502240226)\n", + ", Denmark (55.670249, 10.3333283)\n", + "Tain, Scotland (57.8119372, -4.0550663)\n", + "New York, France (44.8712241, -0.5502475)\n", + "Pyrénées-Atlantiques, France (43.18718655, -0.728247400084667)\n", + "Buxton, Derbyshire, England (53.2593422, -1.9100768)\n", + "Galax, Virginia, United States (36.6612387, -80.9239671)\n", + "Wallonia, Belgium (50.154540049999994, 5.399359762971196)\n", + "Ile-de-France/Champagne, France (48.5499711, 7.7508704)\n", + "Lazio, Sardinia, Italy (41.9808038, 12.7662312)\n", + "Staffordshire, England (52.824694199999996, -2.0074546723348115)\n", + ", Switzerland (46.7985624, 8.2319736)\n", + "Serra da Estrela, Portugal (40.4358994, -7.516865473467464)\n", + "County Carlow, Ireland (52.69078865, -6.825145150844913)\n", + "St. Louis, Missouri, United States (38.6280278, -90.1910154)\n", + "Coquet, England (54.88091196980861, -1.5495607774216265)\n", + "Béarnaise in Pyrénées-Atlantique, France (46.603354, 1.8883335)\n", + "Websterville, VT, United States (44.162985, -72.47576806895253)\n", + ", Poland (52.215933, 19.134422)\n", + "Utah, United States (39.4225192, -111.714358)\n", + "Allagau, Bavarian Alps, Germany (51.1638175, 10.4478313)\n", + "Oregon Coast Range, United States (39.7837304, -100.445882)\n", + "Cotherstone, England (54.570244, -1.9804176)\n", + "Swaledale, North Yorkshire, England (54.38299324007608, -1.9841360652878535)\n", + "Bornholm, Denmark (55.143122399999996, 14.922629658767558)\n", + "Aquitaine, France (44.24620635, -0.18399787392367906)\n", + "old Liburnia (Dalmatia), Croatia (45.3658443, 15.6575209)\n", + "Fethard, Co Tipperary, Ireland (52.467222, -7.691111)\n", + "Northern Holland, Netherlands (52.2434979, 5.6343227)\n", + "Castile-Leon, Spain (41.55005, -5.1387401)\n", + "Naples, Italy (40.8358846, 14.2487679)\n", + "Gravina in Puglia, Murgia, Italy (40.819725, 16.422779)\n", + "Castille-Leon, Spain (41.55005, -5.1387401)\n", + ", Israel (30.8124247, 34.8594762)\n", + "Languedoc-Roussillon, France (43.65420305, 3.674669940206605)\n", + "Orkney Islands, Scotland (58.94182309999999, -3.129694439563327)\n", + ", Italy (42.6384261, 12.674297)\n", + ", United Kingdom (54.7023545, -3.2765753)\n", + "Wales, Great Britain (53.28236125, -3.8286207326666837)\n", + "Wales, London, Wales (52.41446365, -4.0685073132923)\n", + "California, United States (36.7014631, -118.755997)\n", + "Belvederis, Lithuania (55.0820118, 23.3897023)\n", + "Franche Comté, France (48.68347355, 2.1776625116070027)\n", + "Kent, United Kingdom (51.20707485, 0.7210361813401444)\n", + "Bloomdale, United States (33.2473378, -96.6794382)\n", + "Wigtownshire, Scotland (54.9042579, -5.0248893)\n", + ", Ireland (52.865196, -7.9794599)\n", + "County Tipperary, Clogheen, Ireland (52.68482145, -7.898147186112796)\n", + "Colby, Wisconsin, United States (44.5684775, -69.66002565150262)\n", + "Isere, France (45.28979315, 5.634382477386232)\n", + "Kinfauns, Perthshire, Scotland (56.3822607, -3.36565)\n", + ", Mexico (23.6585116, -102.0077097)\n", + "Dumfries, Scotland (55.0691397, -3.6107936)\n", + "Odell, Bedfordshire, England (52.21843025, -0.5921260787763352)\n", + "Avila, Spain (40.656478, -4.7002172)\n", + "Bethania, United Kingdom (52.2509586, -4.0888576)\n", + "Lincolnshire, England (53.1823034, -0.2031208542548153)\n", + "Hamilton, New Zealand (-37.7878809, 175.281788)\n", + ", Greece (38.9953683, 21.9877132)\n", + "New York, United States (40.7127281, -74.0060152)\n", + ", Cyprus (34.9174159, 32.889902651331866)\n", + "South Australia, Australia (-30.5343665, 135.6301212)\n", + "Low-laying regions, Sweden (59.6749712, 14.5208584)\n", + "Serra da Canastra, Minas Gerais state, Brazil (-20.1615, -46.76365461658604)\n", + "Cornwall, (50.443348900000004, -4.62465658489158)\n", + "St Antoine, France (44.0361186, 0.8397552)\n", + "Amou, Gascony, France (43.59266, -0.7475291)\n", + "Charentes-Poitou, France (45.4039367, 0.3756199)\n", + "Co. Carlow, Ireland (52.69078865, -6.825145150844913)\n", + "Äänekoski, Finland (62.6032186, 25.7301361)\n", + ", Spain (39.3260685, -4.8379791)\n", + "Ile de France, France (48.6443057, 2.7537863)\n", + "Seattle, Washington, United States (47.6038321, -122.330062)\n", + "Minnesota, United States (45.9896587, -94.6113288)\n", + "Milford, NJ, United States (41.2222218, -73.0570603)\n", + "Charm, Ohio, United States (40.5067308, -81.7848553)\n", + "Anjou, France (45.3462, 4.88149)\n", + "Pinconning, Michigan, United States (43.853633, -83.964987)\n", + "Derbyshire, Leicestershire, Nottinghamshire, England (53.1666927, -1.5833223)\n", + "Gujarat, India (22.3850051, 71.745261)\n", + ", Mongolia (46.8250388, 103.8499736)\n", + "Central Balkan Mountains, Bulgaria (42.6073975, 25.4856617)\n", + "Schoonrewoerd, Leerdam, Netherlands (51.920458, 5.1156505)\n", + "North East Victoria, Australia (-37.8633951, 145.0100994)\n", + "Bavaria, Germany (48.9467562, 11.4038717)\n", + "Kimball, United States (41.1881305, -103.6997645)\n", + "Illoud (Haute-Marne), France (48.2089823, 5.5615126)\n", + "Ann Arbor, Michigan, United States (42.2813722, -83.7484616)\n", + "Rhone-Alps, France (45.2968119, 4.6604809)\n", + "Mols, Denmark (56.187042, 10.460782482125193)\n", + "Island of Pag, Croatia (45.3658443, 15.6575209)\n", + ", Hungary (47.1817585, 19.5060937)\n", + "Lower Normandy, France (48.953684499999994, -0.573365358805311)\n", + "Midi-Pyrenees, France (43.8099068, 1.4344926056549236)\n", + "Huizen, Netherlands (52.2958122, 5.2567209)\n", + "Upper Corsica, France (46.603354, 1.8883335)\n", + "Basilicata, Italy (40.500571, 16.081953)\n", + "Landford, England (50.9700788, -1.6363792)\n", + "Maribo, Denmark (54.7758018, 11.5054333)\n", + "Virginia, United States (37.1232245, -78.4927721)\n", + "Adamstown, Co Wexford, Ireland (53.3360017, -6.4692321)\n", + "Het Groene Hart, Netherlands (51.5246, 4.280818038775446)\n", + "Sebastopol, California, United States (38.4021038, -122.824222)\n", + "Carrigtwohill, Ireland (51.9094617, -8.2611809)\n", + "County Antrim, Ireland (54.864725500000006, -6.143637910742768)\n", + "Aberdeenshire, Scotland (57.166667, -2.666667)\n", + "massif des Causses, France (46.603354, 1.8883335)\n", + "Asturias, Spain (43.3133868, -5.94192)\n", + "Allgau, Germany (47.8241593, 11.6822424)\n", + "Croisy-sur-Eure, France (49.0291802, 1.346505)\n", + "Northern Wisconsin, United States (44.94725995, -91.39373410986752)\n", + "Carnia, Italy (46.3738716, 13.1339829)\n", + "Vorarlberg, Austria (47.25, 9.9166667)\n", + "Quebec, Canada (52.4760892, -71.8258668)\n", + "Canary Islands, Spain (28.286398900000002, -16.796011808910734)\n", + "Banks Peninsular in Canterbury, New Zealand (-41.5000831, 172.8344077)\n", + "Beira Baixa Province, Portugal (39.6621648, -8.1353519)\n", + "Fairview, United States (40.6333724, -90.1637318)\n", + "Aconcagua, Chile (-33.04383715040669, -71.56622455102398)\n", + "Midi-Pyrénées, France (43.8099068, 1.4344926056549236)\n", + "Landshut, Germany (48.536217, 12.1516551)\n", + ", New Zealand (-41.5000831, 172.8344077)\n", + ", England (52.5310214, -1.2649062)\n", + "Languedoc, France (43.65420305, 3.674669940206605)\n", + ", Afghanistan (33.7680065, 66.2385139)\n", + "NY, United States (43.1561681, -75.8449946)\n", + "Northeastern Brazil, Brazil (-10.3333333, -53.2)\n", + "Piedmont, Italy (45.060735, 7.923549)\n", + "St. Gallen (canton), Tufertschwil, Switzerland (47.1561047, 9.338323)\n", + "Pembrokeshire, United Kingdom (51.8339209, -4.916667)\n", + "Canton of Glarus, Switzerland (46.7985624, 8.2319736)\n", + "South East England, United Kingdom (51.45115235, -0.9935673736185868)\n", + "Ceredigion, United Kingdom (52.2945764, -3.9527809990291427)\n", + "Stonegate, East Sussex, England (53.960910892985034, -1.0833748506182423)\n", + "Tuscany, Italy (43.4586541, 11.1389204)\n", + "Timsbury, Somerset, Scotland (56.7861112, -4.1140518)\n", + "Lucerne, Schwyz, Unterwald, and Zoug, and the following additional places: Muri district in d'Argovi, Switzerland (47.0505452, 8.3054682)\n", + "Prince Edward Island, Canada (46.3355508, -63.1466676)\n", + "Prince Edward County, Ontario, Canada (44.031827, -77.246933)\n", + "Aveyron, France (44.315857449999996, 2.5065697302419823)\n", + "Calabria, Italy (39.0565974, 16.5249864)\n", + "British Columbia, Canada (55.001251, -125.002441)\n", + "Ontario, Canada (50.000678, -86.000977)\n", + "North Cornwall, England (51.7561518, 0.4645198)\n", + "Pennsylvania, United States (40.9699889, -77.7278831)\n", + "Coast of Oregon, United States (39.7837304, -100.445882)\n", + "Veneto, (45.6476663, 11.8665254)\n", + ", Australia (-24.7761086, 134.755)\n", + "Victoria, Australia (-36.5986096, 144.6780052)\n", + "Pays Basque, France (47.6867895, 7.3927627)\n", + ", Mauritania (20.2540382, -9.2399263)\n", + "Richfield, Wisconsin, United States (44.8766431, -93.2877877)\n", + "Poitou-Charentes, France (46.13244785, -0.15455354898441043)\n", + "Pienza, Italy (43.0765485, 11.6789076)\n", + "Herault, France (43.591422, 3.3553309364095925)\n", + "Normandy, Auvilliers, France (49.0677708, 0.3138532)\n", + "Bourgogne, France (47.27808725, 4.222486304306048)\n", + "Póvoa de Lanhoso, Portugal (41.5759516, -8.2699521)\n", + "Cornwall, England (50.416667, -4.75)\n", + "Roncq, France (50.7531232, 3.1209016)\n", + "Laqueuille, France (45.6507627, 2.7320917)\n", + "Bas-Languedoc, Comtat Venaissin, France (43.687621, 4.2691037)\n", + "Zasavica, Serbia (44.9454307, 19.4987239)\n" ] } ], "source": [ - "import time\n", - "import tqdm.notebook as tqdm\n", - "import random\n", - "locations=[]\n", + "locations_to_gps={}\n", + "errors=set()\n", "for loc in tqdm.tqdm(locs):\n", - " print(loc)\n", " time.sleep(1)\n", - " locations.append(Nominatim(user_agent=\"toto\").geocode(loc))\n", " try:\n", - " locations[-1]=locations[-1].latitude,locations[-1].longitude\n", - " except AttributeError:print(\"ERREUR\")" + " locations_to_gps[loc]=str_to_gps(loc)\n", + " print(loc, locations_to_gps[loc])\n", + " except AttributeError:\n", + " print(loc, \"ERROR\")\n", + " errors.add(loc)" + ] + }, + { + "cell_type": "code", + "execution_count": 71, + "id": "a6966ac7-7a69-4829-8588-d10f85ea98a4", + "metadata": {}, + "outputs": [ + { + "name": "stdout", + "output_type": "stream", + "text": [ + "{'Valencia, Spain': (39.4697065, -0.3763353), 'Crotone, Italy': (39.1873894, 16.87828188895307), 'New Hampshire, United States': (43.4849133, -71.6553992), 'Setubal, Palmela and Sesimbra, Portugal': (38.5241783, -8.8932341), ', Turkey': (39.294076, 35.2316631), 'Wisconsin, United States': (44.4308975, -89.6884637), 'Maine, United States': (45.709097, -68.8590201), 'Beara Peninsula, Co. Cork, Ireland': (51.7280451, -9.767906428362338), 'Castilla Leon, Spain': (40.4598868, -3.4720773), ', Wales': (52.2928116, -3.73893), 'Romanian Carpathians, Romania': (46.4046483, 22.9894841933513), 'Pembrokeshire, Wales': (51.8339209, -4.916667), 'Lodi, Italy': (45.2613104, 9.491678060021837), 'Stoneyford, Ireland': (52.5362671, -7.2278963), 'Central and Western Macedonia, Thessaly, Greece': (38.9953683, 21.9877132), ', Armenia': (4.536307, -75.6723751), 'Indiana, United States': (40.3270127, -86.1746933), 'Alba, Italy': (44.7007236, 8.0357786), 'East Sussex, United Kingdom': (50.9404266, 0.3699977891068864), 'Fornells de la Selva, Gironès, Spain': (41.9319675, 2.8090343), ', Iraq': (33.0955793, 44.1749775), 'Treviso, Veneto, Italy': (45.806691349999994, 12.206315763116372), ', Brazil': (-10.3333333, -53.2), 'North Wootton, England': (52.7923213, 0.4278194), 'Modena, Italy': (44.5384728, 10.935960870530739), 'Minas Gerais, Brazil': (-18.5264844, -44.1588654), 'Emilia-Romagna, Italy': (44.525696, 11.039437), 'Centre-Val de Loire, France': (47.5490251, 1.7324062), 'Dumfriesshire, Scotland': (55.166667, -3.5), 'Brisbane, Australia': (-27.4689682, 153.0234991), 'Carrigtwohill, ': (51.9094617, -8.2611809), 'Azores, Portugal': (37.80855645, -25.473137391245295), ', Austria': (47.59397, 14.12456), 'Basque, Pyrenees Mountains, France': (45.359277750000004, -1.1480053453043046), 'North East Victoria, ': (54.699881, -1.6031519), 'Greensboro, VT, United States': (36.0726355, -79.7919754), 'Stawley, near Wellington, Somerset, England': (50.9961449, -3.3382702), 'Central and Western Macedonia, Thessalia, Greece': (38.9953683, 21.9877132), 'Po valley region, Italy': (42.6384261, 12.674297), 'Southwestern Wisconsin, United States': (42.53116075, -90.43762550236468), 'County Wexford, Ireland': (52.46018745, -6.606515459159162), 'Valpadana, Italy': (39.60288591417616, 16.626802703803317), 'Lapland, Finland': (67.69291045, 26.728214183162986), ', United States': (39.7837304, -100.445882), 'Passendale, Belgium': (50.9003015, 3.0203891), 'Dorset, England': (50.79683685, -2.34473226124306), 'Chirac, France': (45.9140138, 0.6548543), 'North Carolina, United States': (35.6729639, -79.0392919), 'Umbria, Lazio, Italy': (42.965916, 12.490236), 'Iowa, United States': (41.9216734, -93.3122705), 'Inagh, Co Clare, ': (52.9071704, -9.2345138), 'Roxburghshire, Scotland': (56.7861112, -4.1140518), 'Sardegna, Italy': (40.0912813, 9.0305773), 'province of Brittany, France': (46.603354, 1.8883335), 'Troyes , Aube, France': (48.2971626, 4.0746257), 'Carneros, Sonoma, California, United States': (33.223027, -111.70568456233669), 'Svaneti, Samegrelo, Georgia': (42.63545205, 42.24871384619953), 'La Velle, Wisconsin, United States': (45.1699553, -109.88428658948227), 'Georgia, United States': (32.3293809, -83.1137366), 'Brickhill, Co. Clare, Ireland': (52.70642975, -8.751786760846851), 'Sulzberg, Austria': (47.52121792021591, 9.91273065974192), 'Nicasio, United States': (38.0615885, -122.6985975), 'Inagh, Co Clare, Ireland': (52.9071704, -9.2345138), 'Burgundy, France': (47.27808725, 4.222486304306048), 'Aveyron, Laguiole, France': (44.315857449999996, 2.5065697302419823), 'Centre , the department of Loiret, France': (47.5490251, 1.7324062), 'Rhone Valley, France': (46.603354, 1.8883335), 'Tasmania, Australia': (-42.035067, 146.6366887), 'South West England, United Kingdom': (51.0339991, -2.949011916021195), ', Canada': (61.0666922, -107.991707), 'Loire Valley, France': (47.44927715, -0.34954901296919916), 'Extremadura, Spain': (39.1748426, -6.1529891), 'New Jersey, United States': (40.0757384, -74.4041622), 'Nord-Pas-de-Calais, France': (50.5289634, 2.454515765955904), 'Piave Valley, Italy, Italy': (45.735099578237005, 7.320173335891282), 'Friuli-Venezia Giulia and the Veneto, Italy': (42.6384261, 12.674297), 'Co. Cork, Ireland': (51.917535900000004, -8.58597726870895), 'North Yorkshire, England': (54.13453275, -1.498628491239545), 'Illinois, United States': (40.0796606, -89.4337288), 'Gâtinais, France': (48.15497515, 2.811419156673292), 'Campania, Paestum, Foggia, Italy': (40.860672, 14.843984), 'Port Townsend, United States': (48.1179702, -122.769544), 'Piemonte, Italy': (45.060735, 7.923549), 'Bregenzerwald, Kleinwalsertal, Großwalsertal, Laiblachtal (Pfänderstock) and Rheintal, Austria': (47.387028799999996, 9.95606355528393), 'Brooklyn NY, United States': (40.6526006, -73.9497211), 'Avesnes, France': (50.5495906, 1.9721295), 'Petaluma, California, United States': (38.2325829, -122.636465), 'Lanarkshire, Scotland': (55.5752966, -3.833333), 'Co Clare, Ireland': (52.857257450000006, -8.937435925994537), 'Mankato, MN, United States': (44.1634663, -93.9993505), 'Friuli Venezia Giulia and Veneto, Italy': (42.6384261, 12.674297), 'Québec, Canada': (52.4760892, -71.8258668), 'Airedale farming district, New Zealand': (-41.5000831, 172.8344077), 'Galicia, Spain': (42.61946, -7.863112), 'Campania, Italy': (40.860672, 14.843984), 'Asiago, Italy': (45.8753771, 11.5106998), 'Monterey, California, United States': (36.2231079, -121.387742), 'Pullman, Washington, United States': (46.7304268, -117.173895), 'Devon, England': (50.724140500000004, -3.6607788161410735), 'Pesaro-Urbino, Italy': (43.694112700000005, 12.701443660480004), 'Ballarat, Victoria, Australia': (-37.5623013, 143.8605645), 'Savoie, France': (45.494895150000005, 6.384660381375652), 'Hunter Valley, Australia': (-32.5421803, 151.2185641), 'Auvergne, Salers, France': (45.2968119, 4.6604809), 'Chelmarsh, Bridgnorth, Shropshire, England': (52.4875359, -2.4124407), 'Duhallow, Ireland': (52.1837912, -9.00609563330653), ', Serbia': (44.024322850000004, 21.07657433209902), 'Stranraer, Scotland': (54.9044332, -5.026204), 'Cotswolds, England': (51.74894260792542, -0.23033349985221635), 'Manitoba, Canada': (55.001251, -97.001038), 'South West England, England': (51.50076785, -2.5503106339491204), 'Berry, France': (44.5760186, 0.3095833), 'Co Limerick, Ireland': (52.518831649999996, -8.795834650292788), 'Averyon, France': (46.603354, 1.8883335), 'Co. Mayo, Ireland': (53.9087056, -9.298304863654256), 'Corsica, France': (42.188089649999995, 9.068413771427695), 'Moliterno, Italy': (40.2423024, 15.868903), 'Castelo Branco, Fundão and Idanha-a-Nova, Portugal': (39.97675825, -7.446059929966704), 'Oristano, Italy': (40.02656765, 8.679641647435716), 'Postel, Belgium': (51.2874865, 5.1897863), ', Iceland': (64.9841821, -18.1059013), 'Brittany, France': (48.2640845, -2.9202408), 'Rio Grande do Sul, Brazil': (-29.8425284, -53.7680577), 'Greenville, Indiana, United States': (34.851354, -82.3984882), 'Macedonia, Thrace, Thessalia, Peloponissos, Ionian Islands, Aegean islands, Crete Island and Epirus, Greece': (40.6186482, 22.91795361795959), 'Shelburne Farms, United States': (34.89046225, -82.24340593189123), 'Provencale, France': (43.7899311033635, 7.524017533510311), 'Oxfordshire, Great Britain': (51.7412674, -1.2245951), 'Swabia, Germany': (48.15313125, 10.47129100603846), 'Comox Valley, Vancouver Island, Canada': (49.670981, -125.0353253), 'Dalmatia, Croatia': (43.538796500000004, 16.175235566874342), 'Murcia, Spain': (37.9923795, -1.1305431), 'Puimichel in Provence Alpes, France': (46.603354, 1.8883335), 'Peekskill, United States': (41.289811, -73.9204922), 'Menorca, Balearic Islands, Spain': (39.949257200000005, 4.0499641751186415), 'New South Wales, Australia': (-31.8759835, 147.2869493), 'Colorado, United States': (38.7251776, -105.607716), 'Piora Valley, Switzerland': (46.7985624, 8.2319736), 'Loire, France': (45.75385355, 4.045473682551104), 'Tieton, Washington, United States': (46.7020686, -120.75535), 'Oviken, Sweden': (62.9974877, 14.3928671), 'Taxco, Mexico': (18.5565446, -99.6052838), 'Rhône-Alpes, France': (45.3175313, 5.721294352585611), 'Bursa, Turkey': (39.9895878, 28.8944669), 'Nottinghamshire, England': (53.1459288, -1.0214971168122484), 'Karlovy Vary, Czech Republic': (50.2306216, 12.8701437), 'County Cavan, Ireland': (54.03497495, -7.2937022825583675), 'Northwest, United States': (34.3129464, -78.1611077), ', Germany': (51.1638175, 10.4478313), ', Sweden': (59.6749712, 14.5208584), ', Argentina': (-34.9964963, -64.9672817), 'Queenstown, New Zealand': (-45.0321923, 168.661), 'All Holland, Netherlands': (52.4601118, 4.6056526), 'Flanders, Belgium': (51.096246199999996, 4.178629103169916), 'West Pawlet, VT, United States': (43.356893, -73.24966776033015), 'Bjurholm, Sweden': (63.966667, 19.0), 'Allgaeu Alps, Germany': (51.1638175, 10.4478313), 'Somerset, England': (51.161750850000004, -3.0753867062227487), 'Herefordshire, West Midlands, United Kingdom': (52.083333, -2.75), 'Västra Götaland, Sweden': (58.215850200000006, 12.651820794914073), ', Scotland': (56.7861112, -4.1140518), 'Provence, France': (44.0580563, 6.0638506), 'Mornington Peninsula, Melbourne, Australia': (-38.3312575, 145.08106868543985), 'Haute-Savoie / Upper Savoy, France': (46.06904065, 6.344532137164), ', Middle East': (39.3014159, -76.5888477), 'Sonoma, California, United States': (38.5110803, -122.8473388), 'Veneto, Italy': (45.6476663, 11.8665254), 'Haute Vienne, France': (45.91901925, 1.203176771876291), 'Gloucestershire County, England': (51.9425914, -2.100154122305389), 'Massachusetts, United States': (42.3788774, -72.032366), 'Carmarthenshire, Wales': (51.893669849999995, -4.217282721429928), 'Orkney Isles, Scotland': (56.7861112, -4.1140518), ', Belgium': (50.6402809, 4.6667145), 'Lombardy, Italy': (45.5703694, 9.7732524), 'Oregon, United States': (43.9792797, -120.737257), 'Cheshire, England': (53.2141028, -2.471770086071205), 'Blarney, Ireland': (51.9325233, -8.5678665), 'Timsbury, Somerset, England': (51.3271927, -2.4755923), 'Veneto, Trentino, Italy': (45.6476663, 11.8665254), 'Co. Offaly, Ireland': (53.13617215, -7.810340751784169), 'Barcelona, Spain': (41.3828939, 2.1774322), 'Sardinia & Campania, Italy': (42.6384261, 12.674297), 'West Bengal, India': (22.9964948, 87.6855882), 'Banon, France': (44.0381752, 5.6296701), 'Laruns, France': (42.9882368, -0.4266324), 'Gevrey-Chambertin, Burgundy, France': (47.2261857, 4.9705666), 'Pyrenees, France': (48.8738565, 2.3852638), 'Murazzano, Italy': (44.4746494, 8.0213361), 'Southern California, United States': (34.169262950000004, -116.787448181486), 'Normandy, France': (49.0677708, 0.3138532), 'Charentes, France': (45.4039367, 0.3756199), 'island wide, Cyprus': (34.9174159, 32.889902651331866), 'Larzac, France': (44.74693, 1.0075), 'Pays d’Auge, Normandy, France': (49.0356178, 0.1573083324015645), 'Pyrenees-Atlantiques, France': (43.18718655, -0.728247400084667), 'Auvergne, France': (45.2968119, 4.6604809), 'Burgund, France': (47.27808725, 4.222486304306048), ', Portugal': (39.6621648, -8.1353519), 'Jura, Switzerland': (47.3566699, 7.1598893), 'Emilia Romagna, Italy': (44.525696, 11.039437), 'East Midlands, England': (53.1188177, -1.2597068974971675), 'Missouri, United States': (38.7604815, -92.5617875), 'Marathon, NY, United States': (44.8914036, -89.7748098), ', Holland': (52.2434979, 5.6343227), 'Ann Arbor, MI, United States': (42.2813722, -83.7484616), 'Cevenes, France': (44.3509309, 3.8584812791602983), 'Bergues, France': (50.9683886, 2.4325247), 'Pokolbin, Hunter Valley, Australia': (-32.7792106, 151.2978747), 'Pyrénées, France': (48.8738565, 2.3852638), ', Netherlands': (52.2434979, 5.6343227), 'Gippsland, Victoria, Australia': (-37.87448275, 146.9111788341666), 'Cumbrian, United Kingdom': (54.478530449999994, -3.06553306667584), 'Friuli-Venezia Giulia, Italy': (46.151042, 13.055904), 'Kilmallock County Limerick, Ireland': (52.400645600000004, -8.571161660434711), 'Gloucestershire, England': (51.7643786, -2.1880661838719386), 'Vermont, United States': (44.5990718, -72.5002608), 'Stewarton, Scotland': (55.680265, -4.5153023), 'Leiden, Netherlands': (52.1594747, 4.4908843), 'Lebanon, CT, United States': (40.375713, -76.4626118), 'Tomales, California, United States': (38.2468075, -122.90630461024097), 'Bermondsey, London, England': (51.4970125, -0.063268), 'Tipperary, Ireland': (52.4734839, -8.1614446), 'Fife, Scotland': (56.3333331, -3.0000001), 'Allgäu, Germany': (47.5926009, 10.209156), ', France': (46.603354, 1.8883335), 'French Basque Country, Midi-Pyrénées, France': (46.603354, 1.8883335), 'Severn Valley, England': (52.454530899999995, -2.3755702502240226), ', Denmark': (55.670249, 10.3333283), 'Tain, Scotland': (57.8119372, -4.0550663), 'New York, France': (44.8712241, -0.5502475), 'Pyrénées-Atlantiques, France': (43.18718655, -0.728247400084667), 'Buxton, Derbyshire, England': (53.2593422, -1.9100768), 'Galax, Virginia, United States': (36.6612387, -80.9239671), 'Wallonia, Belgium': (50.154540049999994, 5.399359762971196), 'Ile-de-France/Champagne, France': (48.5499711, 7.7508704), 'Lazio, Sardinia, Italy': (41.9808038, 12.7662312), 'Staffordshire, England': (52.824694199999996, -2.0074546723348115), ', Switzerland': (46.7985624, 8.2319736), 'Serra da Estrela, Portugal': (40.4358994, -7.516865473467464), 'County Carlow, Ireland': (52.69078865, -6.825145150844913), 'St. Louis, Missouri, United States': (38.6280278, -90.1910154), 'Coquet, England': (54.88091196980861, -1.5495607774216265), 'Béarnaise in Pyrénées-Atlantique, France': (46.603354, 1.8883335), 'Websterville, VT, United States': (44.162985, -72.47576806895253), ', Poland': (52.215933, 19.134422), 'Utah, United States': (39.4225192, -111.714358), 'Allagau, Bavarian Alps, Germany': (51.1638175, 10.4478313), 'Oregon Coast Range, United States': (39.7837304, -100.445882), 'Cotherstone, England': (54.570244, -1.9804176), 'Swaledale, North Yorkshire, England': (54.38299324007608, -1.9841360652878535), 'Bornholm, Denmark': (55.143122399999996, 14.922629658767558), 'Aquitaine, France': (44.24620635, -0.18399787392367906), 'old Liburnia (Dalmatia), Croatia': (45.3658443, 15.6575209), 'Fethard, Co Tipperary, Ireland': (52.467222, -7.691111), 'Northern Holland, Netherlands': (52.2434979, 5.6343227), 'Castile-Leon, Spain': (41.55005, -5.1387401), 'Naples, Italy': (40.8358846, 14.2487679), 'Gravina in Puglia, Murgia, Italy': (40.819725, 16.422779), 'Castille-Leon, Spain': (41.55005, -5.1387401), ', Israel': (30.8124247, 34.8594762), 'Languedoc-Roussillon, France': (43.65420305, 3.674669940206605), 'Orkney Islands, Scotland': (58.94182309999999, -3.129694439563327), ', Italy': (42.6384261, 12.674297), ', United Kingdom': (54.7023545, -3.2765753), 'Wales, Great Britain': (53.28236125, -3.8286207326666837), 'Wales, London, Wales': (52.41446365, -4.0685073132923), 'California, United States': (36.7014631, -118.755997), 'Belvederis, Lithuania': (55.0820118, 23.3897023), 'Franche Comté, France': (48.68347355, 2.1776625116070027), 'Kent, United Kingdom': (51.20707485, 0.7210361813401444), 'Bloomdale, United States': (33.2473378, -96.6794382), 'Wigtownshire, Scotland': (54.9042579, -5.0248893), ', Ireland': (52.865196, -7.9794599), 'County Tipperary, Clogheen, Ireland': (52.68482145, -7.898147186112796), 'Colby, Wisconsin, United States': (44.5684775, -69.66002565150262), 'Isere, France': (45.28979315, 5.634382477386232), 'Kinfauns, Perthshire, Scotland': (56.3822607, -3.36565), ', Mexico': (23.6585116, -102.0077097), 'Dumfries, Scotland': (55.0691397, -3.6107936), 'Odell, Bedfordshire, England': (52.21843025, -0.5921260787763352), 'Avila, Spain': (40.656478, -4.7002172), 'Bethania, United Kingdom': (52.2509586, -4.0888576), 'Lincolnshire, England': (53.1823034, -0.2031208542548153), 'Hamilton, New Zealand': (-37.7878809, 175.281788), ', Greece': (38.9953683, 21.9877132), 'New York, United States': (40.7127281, -74.0060152), ', Cyprus': (34.9174159, 32.889902651331866), 'South Australia, Australia': (-30.5343665, 135.6301212), 'Low-laying regions, Sweden': (59.6749712, 14.5208584), 'Serra da Canastra, Minas Gerais state, Brazil': (-20.1615, -46.76365461658604), 'Cornwall, ': (50.443348900000004, -4.62465658489158), 'St Antoine, France': (44.0361186, 0.8397552), 'Amou, Gascony, France': (43.59266, -0.7475291), 'Charentes-Poitou, France': (45.4039367, 0.3756199), 'Co. Carlow, Ireland': (52.69078865, -6.825145150844913), 'Äänekoski, Finland': (62.6032186, 25.7301361), ', Spain': (39.3260685, -4.8379791), 'Ile de France, France': (48.6443057, 2.7537863), 'Seattle, Washington, United States': (47.6038321, -122.330062), 'Minnesota, United States': (45.9896587, -94.6113288), 'Milford, NJ, United States': (41.2222218, -73.0570603), 'Charm, Ohio, United States': (40.5067308, -81.7848553), 'Anjou, France': (45.3462, 4.88149), 'Pinconning, Michigan, United States': (43.853633, -83.964987), 'Derbyshire, Leicestershire, Nottinghamshire, England': (53.1666927, -1.5833223), 'Gujarat, India': (22.3850051, 71.745261), ', Mongolia': (46.8250388, 103.8499736), 'Central Balkan Mountains, Bulgaria': (42.6073975, 25.4856617), 'Schoonrewoerd, Leerdam, Netherlands': (51.920458, 5.1156505), 'North East Victoria, Australia': (-37.8633951, 145.0100994), 'Bavaria, Germany': (48.9467562, 11.4038717), 'Kimball, United States': (41.1881305, -103.6997645), 'Illoud (Haute-Marne), France': (48.2089823, 5.5615126), 'Ann Arbor, Michigan, United States': (42.2813722, -83.7484616), 'Rhone-Alps, France': (45.2968119, 4.6604809), 'Mols, Denmark': (56.187042, 10.460782482125193), 'Island of Pag, Croatia': (45.3658443, 15.6575209), ', Hungary': (47.1817585, 19.5060937), 'Lower Normandy, France': (48.953684499999994, -0.573365358805311), 'Midi-Pyrenees, France': (43.8099068, 1.4344926056549236), 'Huizen, Netherlands': (52.2958122, 5.2567209), 'Upper Corsica, France': (46.603354, 1.8883335), 'Basilicata, Italy': (40.500571, 16.081953), 'Landford, England': (50.9700788, -1.6363792), 'Maribo, Denmark': (54.7758018, 11.5054333), 'Virginia, United States': (37.1232245, -78.4927721), 'Adamstown, Co Wexford, Ireland': (53.3360017, -6.4692321), 'Het Groene Hart, Netherlands': (51.5246, 4.280818038775446), 'Sebastopol, California, United States': (38.4021038, -122.824222), 'Carrigtwohill, Ireland': (51.9094617, -8.2611809), 'County Antrim, Ireland': (54.864725500000006, -6.143637910742768), 'Aberdeenshire, Scotland': (57.166667, -2.666667), 'massif des Causses, France': (46.603354, 1.8883335), 'Asturias, Spain': (43.3133868, -5.94192), 'Allgau, Germany': (47.8241593, 11.6822424), 'Croisy-sur-Eure, France': (49.0291802, 1.346505), 'Northern Wisconsin, United States': (44.94725995, -91.39373410986752), 'Carnia, Italy': (46.3738716, 13.1339829), 'Vorarlberg, Austria': (47.25, 9.9166667), 'Quebec, Canada': (52.4760892, -71.8258668), 'Canary Islands, Spain': (28.286398900000002, -16.796011808910734), 'Banks Peninsular in Canterbury, New Zealand': (-41.5000831, 172.8344077), 'Beira Baixa Province, Portugal': (39.6621648, -8.1353519), 'Fairview, United States': (40.6333724, -90.1637318), 'Aconcagua, Chile': (-33.04383715040669, -71.56622455102398), 'Midi-Pyrénées, France': (43.8099068, 1.4344926056549236), 'Landshut, Germany': (48.536217, 12.1516551), ', New Zealand': (-41.5000831, 172.8344077), ', England': (52.5310214, -1.2649062), 'Languedoc, France': (43.65420305, 3.674669940206605), ', Afghanistan': (33.7680065, 66.2385139), 'NY, United States': (43.1561681, -75.8449946), 'Northeastern Brazil, Brazil': (-10.3333333, -53.2), 'Piedmont, Italy': (45.060735, 7.923549), 'St. Gallen (canton), Tufertschwil, Switzerland': (47.1561047, 9.338323), 'Pembrokeshire, United Kingdom': (51.8339209, -4.916667), 'Canton of Glarus, Switzerland': (46.7985624, 8.2319736), 'South East England, United Kingdom': (51.45115235, -0.9935673736185868), 'Ceredigion, United Kingdom': (52.2945764, -3.9527809990291427), 'Stonegate, East Sussex, England': (53.960910892985034, -1.0833748506182423), 'Tuscany, Italy': (43.4586541, 11.1389204), 'Timsbury, Somerset, Scotland': (56.7861112, -4.1140518), \"Lucerne, Schwyz, Unterwald, and Zoug, and the following additional places: Muri district in d'Argovi, Switzerland\": (47.0505452, 8.3054682), 'Prince Edward Island, Canada': (46.3355508, -63.1466676), 'Prince Edward County, Ontario, Canada': (44.031827, -77.246933), 'Aveyron, France': (44.315857449999996, 2.5065697302419823), 'Calabria, Italy': (39.0565974, 16.5249864), 'British Columbia, Canada': (55.001251, -125.002441), 'Ontario, Canada': (50.000678, -86.000977), 'North Cornwall, England': (51.7561518, 0.4645198), 'Pennsylvania, United States': (40.9699889, -77.7278831), 'Coast of Oregon, United States': (39.7837304, -100.445882), 'Veneto, ': (45.6476663, 11.8665254), ', Australia': (-24.7761086, 134.755), 'Victoria, Australia': (-36.5986096, 144.6780052), 'Pays Basque, France': (47.6867895, 7.3927627), ', Mauritania': (20.2540382, -9.2399263), 'Richfield, Wisconsin, United States': (44.8766431, -93.2877877), 'Poitou-Charentes, France': (46.13244785, -0.15455354898441043), 'Pienza, Italy': (43.0765485, 11.6789076), 'Herault, France': (43.591422, 3.3553309364095925), 'Normandy, Auvilliers, France': (49.0677708, 0.3138532), 'Bourgogne, France': (47.27808725, 4.222486304306048), 'Póvoa de Lanhoso, Portugal': (41.5759516, -8.2699521), 'Cornwall, England': (50.416667, -4.75), 'Roncq, France': (50.7531232, 3.1209016), 'Laqueuille, France': (45.6507627, 2.7320917), 'Bas-Languedoc, Comtat Venaissin, France': (43.687621, 4.2691037), 'Zasavica, Serbia': (44.9454307, 19.4987239)}\n" + ] + } + ], + "source": [ + "print(locations_to_gps)" ] }, { "cell_type": "code", "execution_count": 75, - "id": "d41b1dc8-90df-44b8-9d83-d218f82a3637", + "id": "c82851db-2726-4f3a-977c-fef529d9fd8c", + "metadata": {}, + "outputs": [ + { + "name": "stdout", + "output_type": "stream", + "text": [ + "{', Mexico and Caribbean'}\n" + ] + } + ], + "source": [ + "print(errors)" + ] + }, + { + "cell_type": "code", + "execution_count": 76, + "id": "f86ec162-6391-49f5-964a-f70f17163a4a", "metadata": {}, "outputs": [ { "data": { "text/plain": [ - "[