-
Notifications
You must be signed in to change notification settings - Fork 8
/
Copy pathclustering_samples.py
94 lines (94 loc) · 8.65 KB
/
clustering_samples.py
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
# Sample vocabulary grouped by category: each key is a snake_case category
# label and each value is a list of example member strings for that category.
# Insertion order of both the keys and the list items is kept as authored.
# NOTE: some strings appear under more than one category (e.g. "orange" is
# listed in both "fruits" and "colors", "Indian" in both "oceans" and
# "cuisines", "chalk" in both "soil_types" and "writing_tools"), so a bare
# string does not always identify a single category.
CLUSTERING_CATEGORIES = {
    "fruits": ["apple", "banana", "mango", "pear", "peach", "orange", "grape", "kiwi"],
    "car_brands": [
        "Toyota", "Ford", "BMW", "Tesla", "GMC", "Kia", "Honda", "Volkswagen", "Nissan",
        "Mercedes-Benz",
    ],
    "government_types": [
        "democracy", "dictatorship", "monarchy", "oligarchy", "republic", "theocracy",
    ],
    "musical_instruments": [
        "guitar", "piano", "drums", "violin", "trumpet", "flute", "saxophone",
    ],
    "sports": [
        "soccer", "basketball", "tennis", "volleyball", "swimming", "cricket", "baseball",
    ],
    "colors": ["red", "blue", "green", "yellow", "purple", "orange", "pink"],
    "planets": [
        "Mars", "Venus", "Jupiter", "Neptune", "Saturn", "Mercury", "Uranus", "Earth",
    ],
    "emotions": ["happiness", "anger", "sadness", "fear", "surprise", "disgust", "joy"],
    "seasons": ["spring", "summer", "winter", "fall"],
    "elements": [
        "oxygen", "carbon", "hydrogen", "nitrogen", "iron", "calcium", "sodium",
    ],
    "languages": [
        "English", "Mandarin", "Spanish", "Hindi", "Arabic", "French", "Russian",
    ],
    "animals": ["lion", "elephant", "penguin", "tiger", "giraffe", "dolphin", "koala"],
    "oceans": ["Pacific", "Atlantic", "Indian", "Arctic", "Southern"],
    "cuisines": [
        "Italian", "Chinese", "Mexican", "Indian", "French", "Japanese", "Thai",
    ],
    "board_games": ["chess", "Monopoly", "Scrabble", "Catan", "Clue", "Risk"],
    "currencies": ["dollar", "euro", "yen", "pound", "yuan", "rupee", "franc"],
    "cloud_types": ["cumulus", "stratus", "cirrus", "nimbus", "altostratus"],
    "precious_stones": [
        "diamond", "ruby", "emerald", "sapphire", "topaz", "opal", "amethyst",
    ],
    "art_movements": [
        "Impressionism", "Cubism", "Surrealism", "Renaissance", "Baroque",
        "Abstract Expressionism",
    ],
    "social_media_platforms": [
        "Facebook", "Twitter", "Instagram", "LinkedIn", "TikTok", "Pinterest", "Snapchat",
    ],
    "mythical_creatures": [
        "dragon", "unicorn", "phoenix", "griffin", "mermaid", "centaur", "werewolf",
    ],
    "computer_parts": [
        "CPU", "RAM", "GPU", "hard drive", "motherboard", "power supply", "SSD",
    ],
    "literary_genres": [
        "romance", "mystery", "science fiction", "fantasy", "horror", "thriller",
        "historical fiction",
    ],
    "dance_styles": [
        "ballet", "hip-hop", "salsa", "contemporary", "tap", "jazz", "ballroom",
    ],
    "renewable_energy_sources": [
        "solar", "wind", "hydroelectric", "geothermal", "biomass", "tidal",
    ],
    "phobias": [
        "arachnophobia", "claustrophobia", "acrophobia", "agoraphobia", "ophidiophobia",
        "nyctophobia",
    ],
    "ancient_civilizations": [
        "Egyptian", "Greek", "Mayan", "Roman", "Mesopotamian", "Incan", "Chinese",
    ],
    "coffee_types": [
        "espresso", "cappuccino", "latte", "americano", "mocha", "macchiato", "cold brew",
    ],
    "movie_genres": [
        "comedy", "horror", "action", "drama", "romance", "thriller", "documentary",
    ],
    "olympic_sports": [
        "gymnastics", "swimming", "archery", "athletics", "cycling", "judo", "rowing",
    ],
    "types_of_rocks": ["igneous", "sedimentary", "metamorphic"],
    "punctuation_marks": [
        "comma", "period", "semicolon", "colon", "exclamation point", "question mark",
        "hyphen",
    ],
    "school_subjects": [
        "mathematics", "history", "biology", "physics", "literature", "chemistry",
        "geography",
    ],
    "weather_phenomena": [
        "tornado", "hurricane", "blizzard", "thunderstorm", "hailstorm", "fog", "drought",
    ],
    "cooking_methods": [
        "boiling", "frying", "baking", "grilling", "roasting", "steaming", "sautéing",
    ],
    "types_of_teeth": ["incisor", "canine", "molar", "premolar", "wisdom tooth"],
    "constellations": [
        "Orion", "Ursa Major", "Cassiopeia", "Leo", "Scorpius", "Cygnus", "Taurus",
    ],
    "political_ideologies": [
        "conservatism", "liberalism", "socialism", "fascism", "anarchism", "communism",
    ],
    "blood_types": ["A", "B", "O", "AB"],
    "types_of_poems": [
        "sonnet", "haiku", "limerick", "free verse", "ballad", "ode", "epic",
    ],
    "geometric_shapes": [
        "triangle", "square", "circle", "rectangle", "pentagon", "hexagon", "octagon",
    ],
    "chemical_states": ["solid", "liquid", "gas", "plasma"],
    "types_of_forests": ["tropical", "temperate", "boreal", "mangrove", "cloud"],
    "vitamins": ["C", "D", "E", "K", "B1", "B12"],
    "video_game_consoles": ["PlayStation", "Xbox", "Nintendo", "Sega", "Atari"],
    "types_of_pasta": [
        "spaghetti", "penne", "lasagna", "fettuccine", "ravioli", "linguine", "fusilli",
    ],
    "cognitive_biases": [
        "confirmation bias", "anchoring bias", "availability bias",
        "dunning-kruger effect", "hindsight bias",
    ],
    "types_of_bridges": [
        "suspension", "arch", "truss", "beam", "cantilever", "cable-stayed",
    ],
    "programming_languages": [
        "Python", "Java", "C++", "JavaScript", "Ruby", "Swift", "Go",
    ],
    "zodiac_signs": [
        "Aries", "Leo", "Scorpio", "Taurus", "Virgo", "Capricorn", "Gemini", "Libra",
        "Aquarius", "Cancer",
    ],
    "dog_breeds": [
        "Labrador", "Poodle", "Chihuahua", "German Shepherd", "Bulldog",
        "Golden Retriever", "Beagle",
    ],
    "clothing_materials": [
        "cotton", "polyester", "silk", "wool", "linen", "denim", "leather",
    ],
    "fast_food_chains": [
        "McDonald's", "KFC", "Subway", "Burger King", "Wendy's", "Taco Bell", "Pizza Hut",
    ],
    "tree_types": ["oak", "pine", "maple", "birch", "willow", "cedar", "elm"],
    "alcoholic_beverages": ["beer", "wine", "whiskey", "vodka", "rum", "gin", "tequila"],
    "continents": [
        "Africa", "Asia", "Europe", "North America", "South America", "Australia",
        "Antarctica",
    ],
    "bread_types": [
        "sourdough", "rye", "ciabatta", "baguette", "brioche", "focaccia", "pumpernickel",
    ],
    "shoe_types": ["sneakers", "sandals", "boots", "loafers", "high heels", "flats"],
    "dinosaurs": [
        "Tyrannosaurus", "Stegosaurus", "Velociraptor", "Triceratops", "Brachiosaurus",
        "Pteranodon", "Ankylosaurus",
    ],
    "mobile_phone_brands": [
        "Apple", "Samsung", "Huawei", "Xiaomi", "OnePlus", "Google", "LG",
    ],
    "flower_types": [
        "rose", "tulip", "sunflower", "daisy", "lily", "orchid", "carnation",
    ],
    "music_genres": [
        "rock", "jazz", "classical", "hip-hop", "country", "electronic", "reggae",
    ],
    "transportation_modes": [
        "car", "bicycle", "airplane", "train", "bus", "boat", "motorcycle",
    ],
    "restaurant_types": [
        "fine dining", "fast casual", "buffet", "cafe", "bistro", "steakhouse",
        "sushi bar",
    ],
    "body_organs": [
        "heart", "liver", "brain", "lungs", "kidneys", "stomach", "pancreas",
    ],
    "hat_types": [
        "baseball cap", "fedora", "beanie", "beret", "cowboy hat", "top hat", "bowler",
    ],
    "ancient_wonders": [
        "Pyramids of Giza",
        "Hanging Gardens of Babylon",
        "Colossus of Rhodes",
        "Lighthouse of Alexandria",
        "Temple of Artemis",
        "Statue of Zeus",
        "Mausoleum at Halicarnassus",
    ],
    "insurance_types": ["life", "health", "auto", "home", "travel", "disability", "pet"],
    "mountain_types": ["fold", "block", "volcanic", "dome", "plateau"],
    "tea_types": [
        "green", "black", "oolong", "white", "pu-erh", "chamomile", "rooibos",
    ],
    "mythologies": ["Greek", "Norse", "Egyptian", "Roman", "Celtic", "Hindu", "Chinese"],
    "web_browsers": ["Chrome", "Firefox", "Safari", "Edge", "Opera", "Brave"],
    "farm_types": [
        "dairy", "crop", "poultry", "livestock", "fruit", "vegetable", "mixed",
    ],
    "martial_arts": [
        "karate", "judo", "taekwondo", "kung fu", "aikido", "jiu-jitsu", "muay thai",
    ],
    "boat_types": [
        "sailboat", "kayak", "yacht", "canoe", "motorboat", "catamaran", "cruise ship",
    ],
    "literary_devices": [
        "metaphor", "simile", "personification", "alliteration", "hyperbole", "irony",
        "onomatopoeia",
    ],
    "plastic_types": [
        "polyethylene", "polypropylene", "PVC", "polystyrene", "nylon", "acrylic",
    ],
    "cloud_services": [
        "AWS", "Azure", "Google Cloud", "IBM Cloud", "Oracle Cloud", "DigitalOcean",
    ],
    "volcano_types": ["shield", "composite", "cinder cone", "caldera", "lava dome"],
    "personality_traits": [
        "extroversion", "conscientiousness", "openness", "agreeableness", "neuroticism",
    ],
    "celestial_objects": [
        "star", "galaxy", "nebula", "planet", "asteroid", "comet", "black hole",
    ],
    "neuron_types": ["sensory", "motor", "interneuron", "pyramidal", "Purkinje"],
    "soil_types": ["clay", "sand", "loam", "silt", "peat", "chalk"],
    "writing_tools": [
        "pen", "pencil", "marker", "fountain pen", "quill", "chalk", "crayon",
    ],
    "mirror_types": ["plane", "convex", "concave", "parabolic"],
    "wind_instruments": [
        "flute", "clarinet", "saxophone", "trumpet", "trombone", "oboe", "bassoon",
    ],
    "fish_types": ["salmon", "tuna", "cod", "trout", "bass", "halibut", "mackerel"],
    "hair_colors": [
        "blonde", "brunette", "redhead", "black", "gray", "white", "auburn",
    ],
    "camping_gear": [
        "tent", "sleeping bag", "flashlight", "backpack", "camping stove", "water filter",
        "compass",
    ],
    "lens_types": ["convex", "concave", "bifocal", "toric", "progressive", "prismatic"],
    "gardening_tools": [
        "shovel", "rake", "pruning shears", "trowel", "hoe", "watering can",
        "wheelbarrow",
    ],
    "desert_types": ["hot and dry", "semi-arid", "coastal", "cold", "polar"],
}