import nltk
from nltk.corpus import words
import random
import string

# Download NLTK word list
nltk.download('words', quiet=True)

# Get NLTK word list
NLTK_WORDS = set(words.words())

# English word list (focusing on short words)
ENGLISH_WORDS = [
    # 3-4 character words (basic)
    'art', 'box', 'cat', 'dog', 'egg', 'fox', 'hat', 'ice', 'jam', 'key',
    'log', 'map', 'net', 'oil', 'pen', 'rat', 'sun', 'tea', 'use', 'van',
    'web', 'yes', 'zip', 'air', 'bus', 'cup', 'day', 'eye', 'fly', 'gas',
    'hot', 'ink', 'joy', 'kid', 'law', 'man', 'now', 'old', 'pig', 'red',
    'sky', 'top', 'up', 'win', 'zoo', 'arm', 'bed', 'car', 'desk', 'ear',
    
    # 3-4 character words (additional)
    'ace', 'bad', 'cow', 'dry', 'end', 'fit', 'gap', 'hit', 'jet', 'kit',
    'low', 'mix', 'new', 'odd', 'pay', 'raw', 'set', 'try', 'use', 'via',
    'way', 'yes', 'zap', 'act', 'big', 'cut', 'dig', 'eat', 'fix', 'get',
    'hit', 'jog', 'key', 'let', 'mix', 'nap', 'own', 'put', 'run', 'sit',
    
    # 5-6 character words (basic)
    'apple', 'beach', 'cloud', 'dream', 'earth', 'field', 'green', 'house',
    'island', 'jelly', 'knife', 'light', 'music', 'night', 'ocean', 'paper',
    'queen', 'river', 'stone', 'table', 'umbrella', 'voice', 'water', 'xray',
    'yellow', 'zebra', 'alpha', 'brave', 'candy', 'dance', 'eagle', 'flame',
    'ghost', 'heart', 'ivory', 'jewel', 'kite', 'lemon', 'magic', 'noble',
    
    # 5-6 character words (additional)
    'amber', 'bloom', 'coral', 'daisy', 'ember', 'frost', 'glade', 'honey',
    'ivory', 'jade', 'kale', 'lunar', 'moss', 'navy', 'opal', 'pearl',
    'quartz', 'ruby', 'sapphire', 'topaz', 'umber', 'violet', 'wine', 'xenon',
    'yellow', 'zinc', 'azure', 'bronze', 'copper', 'diamond', 'emerald',
    'fuchsia', 'golden', 'honey', 'indigo', 'jade', 'khaki', 'lilac',
    
    # 5-6 character words (technical)
    'alpha', 'beta', 'cache', 'delta', 'echo', 'flash', 'gamma', 'host',
    'input', 'jump', 'kernel', 'logic', 'matrix', 'node', 'output', 'proxy',
    'query', 'router', 'server', 'target', 'update', 'vector', 'window',
    'xenon', 'yield', 'zenith', 'access', 'binary', 'client', 'domain',
    
    # 7-8 character words (basic)
    'academy', 'breeze', 'crystal', 'diamond', 'eclipse', 'freedom', 'garden',
    'harmony', 'infinity', 'journey', 'kingdom', 'liberty', 'mountain',
    'nature', 'ocean', 'paradise', 'quality', 'rainbow', 'sunshine',
    'treasure', 'universe', 'victory', 'wisdom', 'xenial', 'yearning',
    
    # 7-8 character words (additional)
    'abundant', 'brilliant', 'creative', 'delicate', 'elegant', 'fragrant',
    'graceful', 'harmonious', 'inspiring', 'joyful', 'kindred', 'luminous',
    'majestic', 'noble', 'peaceful', 'radiant', 'serene', 'tranquil',
    'unique', 'vibrant', 'wholesome', 'xenial', 'yearning', 'zealous',
    
    # 7-8 character words (technical)
    'advanced', 'browser', 'computer', 'database', 'encrypt', 'firewall',
    'gateway', 'hardware', 'internet', 'junction', 'keyboard', 'language',
    'monitor', 'network', 'operator', 'protocol', 'quantum', 'realtime',
    'software', 'terminal', 'upstream', 'virtual', 'wireless', 'xenon',
    'yield', 'zenith',
    # Add words with 10+ characters
    'strawberry', 'watermelon', 'honeydew', 'blueberry',
    'raspberry', 'blackberry', 'cranberry', 'elderberry',
    'gooseberry', 'huckleberry', 'strawberry', 'watermelon',
    'pineapple', 'pomegranate', 'rhubarb', 'strawberry',
    'tangerine', 'watermelon', 'zucchini', 'strawberry',
    'watermelon', 'honeydew', 'blueberry', 'raspberry',
    'blackberry', 'cranberry', 'elderberry', 'gooseberry',
    'huckleberry', 'strawberry', 'watermelon', 'pineapple',
    'pomegranate', 'rhubarb', 'strawberry', 'tangerine',
    'watermelon', 'zucchini', 'strawberry', 'watermelon'
]

def shuffle_word(word):
    """Shuffle characters within a word"""
    chars = list(word)
    random.shuffle(chars)
    return ''.join(chars)

# English word list (with shuffled characters in each word)
SHUFFLED_ENGLISH_WORDS = [
    shuffle_word(word) for word in ENGLISH_WORDS
]

# German word list (only non-overlapping with NLTK words)
GERMAN_WORDS = [
    word for word in [
        # 3-4 character words (basic)
        'alt', 'bad', 'das', 'ein', 'frei', 'gut', 'haus', 'ich', 'ja', 'kalt',
        'lang', 'mein', 'neu', 'oder', 'post', 'rot', 'satz', 'tag', 'und', 'von',
        'weg', 'zeit', 'arm', 'dank', 'eins', 'fuss', 'gold', 'hand', 'jahr',
        'kopf', 'luft', 'maus', 'nord', 'ost', 'park', 'raum', 'saft', 'tier', 'warm',
        
        # 3-4 character words (additional)
        'ach', 'berg', 'dort', 'ecke', 'feld', 'gast', 'holz', 'jagd', 'kino',
        'land', 'mild', 'nett', 'plan', 'ring', 'soll', 'toll', 'voll', 'wild',
        'zart', 'brot', 'dunk', 'eile', 'fest', 'gern', 'hell', 'klar', 'laut',
        
        # 5-6 character words (basic)
        'abend', 'braun', 'danke', 'essen', 'frage', 'garten', 'herbst', 'idee',
        'junge', 'kinder', 'leben', 'morgen', 'nacht', 'orange', 'pferd', 'quelle',
        'reise', 'sommer', 'traum', 'urlaub', 'vogel', 'winter', 'zimmer', 'apfel',
        'brot', 'durst', 'eimer', 'fisch', 'gross', 'himmel', 'immer', 'jung',
        
        # 5-6 character words (additional)
        'abend', 'braun', 'danke', 'essen', 'frage', 'garten', 'herbst', 'idee',
        'junge', 'kinder', 'leben', 'morgen', 'nacht', 'orange', 'pferd', 'quelle',
        'reise', 'sommer', 'traum', 'urlaub', 'vogel', 'winter', 'zimmer', 'apfel',
        'brot', 'durst', 'eimer', 'fisch', 'gross', 'himmel', 'immer', 'jung',
        
        # 7-8 character words (basic)
        'abenteuer', 'brillant', 'diamant', 'elefant', 'freiheit',
        'garten', 'harmonie', 'infinity', 'jubel', 'kreativ', 'liebe', 'majestaet',
        'natur', 'oase', 'paradise', 'qualitaet', 'regenbogen', 'sonnenschein',
        'traum', 'universum', 'viktoria', 'weisheit', 'xenial', 'jahr',
        
        # 7-8 character words (additional)
        'abundant', 'brillant', 'kreativ', 'delikat', 'elegant', 'fragrant',
        'graziös', 'harmonisch', 'inspirierend', 'jubelnd', 'kreativ', 'leuchtend',
        'majestaetisch', 'nobel', 'friedlich', 'strahlend', 'seren', 'tranquil',
        'einzigartig', 'vibrant', 'wholesome', 'xenial', 'yearning', 'zealous',
        
        # New words (3-4 characters)
        'axt', 'brot', 'dach', 'ecke', 'fels', 'gras', 'hut', 'jagd', 'korn',
        'luft', 'moor', 'nest', 'ofen', 'pult', 'raum', 'sand', 'turm', 'wald',
        'zeit', 'zorn', 'arm', 'brot', 'dank', 'eile', 'fuss', 'gold', 'hand',
        
        # New words (5-6 characters)
        'abend', 'braun', 'danke', 'essen', 'frage', 'garten', 'herbst', 'idee',
        'junge', 'kinder', 'leben', 'morgen', 'nacht', 'orange', 'pferd', 'quelle',
        'reise', 'sommer', 'traum', 'urlaub', 'vogel', 'winter', 'zimmer', 'apfel',
        'brot', 'durst', 'eimer', 'fisch', 'gross', 'himmel', 'immer', 'jung',
        
        # New words (7-8 characters)
        'abenteuer', 'brillant', 'diamant', 'elefant', 'freiheit', 'garten',
        'harmonie', 'infinity', 'jubel', 'kreativ', 'liebe', 'majestaet', 'natur',
        'oase', 'paradise', 'qualitaet', 'regenbogen', 'sonnenschein', 'traum',
        # Add words with 10+ characters
        'erdbeere', 'wassermelone', 'honigmelone', 'blaubeere',
        'himbeere', 'brombeere', 'preiselbeere', 'holunderbeere',
        'stachelbeere', 'heidelbeere', 'erdbeere', 'wassermelone',
        'ananas', 'granatapfel', 'rhabarber', 'erdbeere',
        'mandarine', 'wassermelone', 'zucchini', 'erdbeere',
        'wassermelone', 'honigmelone', 'blaubeere', 'himbeere',
        'brombeere', 'preiselbeere', 'holunderbeere', 'stachelbeere',
        'heidelbeere', 'erdbeere', 'wassermelone', 'ananas',
        'granatapfel', 'rhabarber', 'erdbeere', 'mandarine',
        'wassermelone', 'zucchini', 'erdbeere', 'wassermelone'
    ] if word.lower() not in NLTK_WORDS
]

# Dutch word list (only non-overlapping with NLTK words)
DUTCH_WORDS = [
    word for word in [
        # 3-4 character words (basic)
        'aan', 'bij', 'dag', 'een', 'fijn', 'goed', 'huis', 'ik', 'ja', 'koud',
        'lang', 'mijn', 'nieuw', 'of', 'post', 'rood', 'snel', 'tijd', 'uit', 'van',
        'weg', 'zijn', 'arm', 'dank', 'een', 'fout', 'goud', 'hand', 'jaar',
        'kop', 'lucht', 'muis', 'noord', 'oost', 'park', 'ruim', 'sap', 'tier', 'warm',
        
        # 3-4 character words (additional)
        'bak', 'dak', 'eik', 'gat', 'hut', 'ijs', 'kas', 'lot', 'mat', 'net',
        'oog', 'pad', 'rok', 'sok', 'tak', 'uur', 'vat', 'wip', 'zak', 'zon',
        'aap', 'bal', 'dier', 'eend', 'fles', 'glas', 'haar', 'jurk', 'kast', 'lamp',
        
        # 5-6 character words (basic)
        'avond', 'bruin', 'dank', 'eten', 'vraag', 'tuin', 'herfst', 'idee',
        'jong', 'kinder', 'leven', 'morgen', 'nacht', 'oranje', 'paard', 'bron',
        'reis', 'zomer', 'droom', 'vakantie', 'vogel', 'winter', 'kamer', 'appel',
        'brood', 'dorst', 'emmer', 'vis', 'groot', 'hemel', 'altijd', 'jong',
        
        # 5-6 character words (additional)
        'appel', 'beker', 'dakpan', 'eikels', 'flesje', 'gras', 'honing', 'jassen',
        'kastje', 'lampen', 'muziek', 'natuur', 'oogjes', 'pannen', 'raam', 'schoen',
        'tafel', 'uren', 'vriend', 'winkel', 'zomer', 'appel', 'beker', 'dakpan',
        
        # 7-8 character words (basic)
        'avontuur', 'briljant', 'computer', 'diamant', 'olifant', 'vrijheid',
        'tuin', 'harmonie', 'oneindig', 'vreugde', 'creatief', 'liefde', 'majesteit',
        'natuur', 'oase', 'paradijs', 'kwaliteit', 'regenboog', 'zonneschijn',
        'droom', 'universum', 'victorie', 'wijsheid', 'xenial', 'jaar',
        
        # 7-8 character words (additional)
        'appeltaart', 'bessen', 'druiven', 'eikenhout', 'framboos', 'goudvis',
        'honingbij', 'jasmijn', 'kastanje', 'lavendel', 'madelief', 'narcis',
        'orchidee', 'pioenroos', 'rozen', 'seringen', 'tulp', 'viooltje',
        'wildebloem', 'zonnebloem',
        
        # New words (3-4 characters)
        'aap', 'bal', 'dak', 'eik', 'gat', 'hut', 'ijs', 'kas', 'lot', 'mat',
        'net', 'oog', 'pad', 'rok', 'sok', 'tak', 'uur', 'vat', 'wip', 'zak',
        'zon', 'aap', 'bal', 'dier', 'eend', 'fles', 'glas', 'haar', 'jurk',
        
        # New words (5-6 characters)
        'appel', 'beker', 'dakpan', 'eikels', 'flesje', 'gras', 'honing', 'jassen',
        'kastje', 'lampen', 'muziek', 'natuur', 'oogjes', 'pannen', 'raam', 'schoen',
        'tafel', 'uren', 'vriend', 'winkel', 'zomer', 'appel', 'beker', 'dakpan',
        
        # New words (7-8 characters)
        'avontuur', 'briljant', 'computer', 'diamant', 'olifant', 'vrijheid',
        'tuin', 'harmonie', 'oneindig', 'vreugde', 'creatief', 'liefde', 'majesteit',
        'natuur', 'oase', 'paradijs', 'kwaliteit', 'regenboog', 'zonneschijn',
        # Add words with 10+ characters
        'aardbei', 'watermeloen', 'honingmeloen', 'bosbes',
        'framboos', 'braambes', 'rode bes', 'vlierbes',
        'kruisbes', 'blauwe bes', 'aardbei', 'watermeloen',
        'ananas', 'granaatappel', 'rabarber', 'aardbei',
        'mandarijn', 'watermeloen', 'courgette', 'aardbei',
        'watermeloen', 'honingmeloen', 'bosbes', 'framboos',
        'braambes', 'rode bes', 'vlierbes', 'kruisbes',
        'blauwe bes', 'aardbei', 'watermeloen', 'ananas',
        'granaatappel', 'rabarber', 'aardbei', 'mandarijn',
        'watermeloen', 'courgette', 'aardbei', 'watermeloen'
    ] if word.lower() not in NLTK_WORDS
]

# French word list (only non-overlapping with NLTK words)
FRENCH_WORDS = [
    word for word in [
        # 3-4 character words (basic)
        'age', 'bas', 'cafe', 'don', 'eau', 'fin', 'gare', 'ici', 'jour', 'lune',
        'main', 'nuit', 'or', 'pain', 'rose', 'soleil', 'temps', 'un', 'vent', 'zinc',
        'ami', 'bleu', 'chat', 'dame', 'elle', 'fleur', 'gout', 'haut', 'jour', 'lait',
        
        # 3-4 character words (additional)
        'arc', 'bleu', 'chat', 'dame', 'eau', 'fils', 'gout', 'haut', 'ici', 'jour',
        'lune', 'main', 'nuit', 'or', 'pain', 'rose', 'soleil', 'temps', 'un', 'vent',
        'zinc', 'ami', 'bleu', 'chat', 'dame', 'elle', 'fleur', 'gout', 'haut', 'jour',
        
        # 5-6 character words (basic)
        'amour', 'belle', 'couleur', 'dormir', 'ecrire', 'fleur', 'garcon', 'hiver',
        'idee', 'journee', 'livre', 'maison', 'nature', 'orange', 'parler', 'quatre',
        'revoir', 'soleil', 'table', 'univers', 'voyage', 'zebre', 'appel', 'bureau',
        
        # 5-6 character words (additional)
        'appel', 'bureau', 'couleur', 'dormir', 'ecrire', 'fleur', 'garcon', 'hiver',
        'idee', 'journee', 'livre', 'maison', 'nature', 'orange', 'parler', 'quatre',
        'revoir', 'soleil', 'table', 'univers', 'voyage', 'zebre', 'appel', 'bureau',
        
        # 7-8 character words (basic)
        'aventure', 'brillant', 'chanson', 'diamant', 'elephant', 'fleurir',
        'garden', 'harmonie', 'infini', 'journee', 'kilo', 'lampe', 'maison',
        'nature', 'ocean', 'paradis', 'qualite', 'reponse', 'soleil', 'table',
        'univers', 'voyage', 'zebre',
        
        # 7-8 character words (additional)
        'appetit', 'brillant', 'chanson', 'diamant', 'elephant', 'fleurir',
        'garden', 'harmonie', 'infini', 'journee', 'kilo', 'lampe', 'maison',
        'nature', 'ocean', 'paradis', 'qualite', 'reponse', 'soleil', 'table',
        'univers', 'voyage', 'zebre',
        
        # New words (3-4 characters)
        'arc', 'bleu', 'chat', 'dame', 'eau', 'fils', 'gout', 'haut', 'ici', 'jour',
        'lune', 'main', 'nuit', 'or', 'pain', 'rose', 'soleil', 'temps', 'un', 'vent',
        'zinc', 'ami', 'bleu', 'chat', 'dame', 'elle', 'fleur', 'gout', 'haut', 'jour',
        
        # New words (5-6 characters)
        'amour', 'belle', 'couleur', 'dormir', 'ecrire', 'fleur', 'garcon', 'hiver',
        'idee', 'journee', 'livre', 'maison', 'nature', 'orange', 'parler', 'quatre',
        'revoir', 'soleil', 'table', 'univers', 'voyage', 'zebre', 'appel', 'bureau',
        
        # New words (7-8 characters)
        'aventure', 'brillant', 'chanson', 'diamant', 'elephant', 'fleurir',
        'garden', 'harmonie', 'infini', 'journee', 'kilo', 'lampe', 'maison',
        'nature', 'ocean', 'paradis', 'qualite', 'reponse', 'soleil', 'table',
        # Add words with 10+ characters
        'fraise', 'pastèque', 'melon', 'myrtille',
        'framboise', 'mûre', 'groseille', 'sureau',
        'groseille à maquereau', 'myrtille', 'fraise', 'pastèque',
        'ananas', 'grenade', 'rhubarbe', 'fraise',
        'mandarine', 'pastèque', 'courgette', 'fraise',
        'pastèque', 'melon', 'myrtille', 'framboise',
        'mûre', 'groseille', 'sureau', 'groseille à maquereau',
        'myrtille', 'fraise', 'pastèque', 'ananas',
        'grenade', 'rhubarbe', 'fraise', 'mandarine',
        'pastèque', 'courgette', 'fraise', 'pastèque'
    ] if word.lower() not in NLTK_WORDS
]

# Polish word list (only non-overlapping with NLTK words)
POLISH_WORDS = [
    word for word in [
        # 3-4 character words (basic)
        'dom', 'kot', 'las', 'morze', 'noc', 'ogien', 'pies', 'ryba', 'slonce', 'trawa',
        'woda', 'zima', 'auto', 'brama', 'cukier', 'domek', 'ekran', 'fala', 'gara',
        'hala', 'igla', 'jablko', 'kawa', 'lampa', 'mama', 'noga', 'okno', 'praca',
        
        # 3-4 character words (additional)
        'bak', 'dak', 'eik', 'gat', 'hut', 'ijs', 'kas', 'lot', 'mat', 'net',
        'oog', 'pad', 'rok', 'sok', 'tak', 'uur', 'vat', 'wip', 'zak', 'zon',
        'aap', 'bal', 'dier', 'eend', 'fles', 'glas', 'haar', 'jurk', 'kast', 'lamp',
        
        # 5-6 character words (basic)
        'ksiazka', 'ludzie', 'morze', 'nocleg', 'ogrod', 'praca', 'rynek', 'slonce',
        'trawa', 'woda', 'zima', 'auto', 'brama', 'cukier', 'domek', 'ekran',
        'fala', 'gara', 'hala', 'igla', 'jablko', 'kawa', 'lampa', 'mama',
        
        # 5-6 character words (additional)
        'appel', 'beker', 'dakpan', 'eikels', 'flesje', 'gras', 'honing', 'jassen',
        'kastje', 'lampen', 'muziek', 'natuur', 'oogjes', 'pannen', 'raam', 'schoen',
        'tafel', 'uren', 'vriend', 'winkel', 'zomer', 'appel', 'beker', 'dakpan',
        
        # 7-8 character words (basic)
        'ksiazka', 'ludzie', 'morze', 'nocleg', 'ogrod', 'praca', 'rynek', 'slonce',
        'trawa', 'woda', 'zima', 'auto', 'brama', 'cukier', 'domek', 'ekran',
        'fala', 'gara', 'hala', 'igla', 'jablko', 'kawa', 'lampa', 'mama',
        
        # 7-8 character words (additional)
        'appetit', 'brillant', 'chanson', 'diamant', 'elephant', 'fleurir',
        'garden', 'harmonie', 'infini', 'journee', 'kilo', 'lampe', 'maison',
        'nature', 'ocean', 'paradis', 'qualite', 'reponse', 'soleil', 'table',
        'univers', 'voyage', 'zebre',
        
        # New words (3-4 characters)
        'bak', 'dak', 'eik', 'gat', 'hut', 'ijs', 'kas', 'lot', 'mat', 'net',
        'oog', 'pad', 'rok', 'sok', 'tak', 'uur', 'vat', 'wip', 'zak', 'zon',
        'aap', 'bal', 'dier', 'eend', 'fles', 'glas', 'haar', 'jurk', 'kast', 'lamp',
        
        # New words (5-6 characters)
        'ksiazka', 'ludzie', 'morze', 'nocleg', 'ogrod', 'praca', 'rynek', 'slonce',
        'trawa', 'woda', 'zima', 'auto', 'brama', 'cukier', 'domek', 'ekran',
        'fala', 'gara', 'hala', 'igla', 'jablko', 'kawa', 'lampa', 'mama',
        
        # New words (7-8 characters)
        'ksiazka', 'ludzie', 'morze', 'nocleg', 'ogrod', 'praca', 'rynek', 'slonce',
        'trawa', 'woda', 'zima', 'auto', 'brama', 'cukier', 'domek', 'ekran',
        'fala', 'gara', 'hala', 'igla', 'jablko', 'kawa', 'lampa', 'mama',
        # Add words with 10+ characters
        'truskawka', 'arbuz', 'melon', 'borówka',
        'malina', 'jeżyna', 'porzeczka', 'bez',
        'agrest', 'jagoda', 'truskawka', 'arbuz',
        'ananas', 'granat', 'rabarbar', 'truskawka',
        'mandarynka', 'arbuz', 'cukinia', 'truskawka',
        'arbuz', 'melon', 'borówka', 'malina',
        'jeżyna', 'porzeczka', 'bez', 'agrest',
        'jagoda', 'truskawka', 'arbuz', 'ananas',
        'granat', 'rabarbar', 'truskawka', 'mandarynka',
        'arbuz', 'cukinia', 'truskawka', 'arbuz'
    ] if word.lower() not in NLTK_WORDS
]

# Hungarian word list (only non-overlapping with NLTK words)
HUNGARIAN_WORDS = [
    word for word in [
        # 3-4 character words (basic)
        'agy', 'bor', 'cukor', 'dio', 'eg', 'fa', 'gitar', 'haz', 'ido', 'jeg',
        'kep', 'lab', 'mez', 'nap', 'or', 'pal', 'rak', 'sor', 'taj', 'uj',
        'var', 'zold', 'auto', 'boka', 'cipo', 'daru', 'eger', 'falu', 'golyo',
        
        # 3-4 character words (additional)
        'bak', 'dak', 'eik', 'gat', 'hut', 'ijs', 'kas', 'lot', 'mat', 'net',
        'oog', 'pad', 'rok', 'sok', 'tak', 'uur', 'vat', 'wip', 'zak', 'zon',
        'aap', 'bal', 'dier', 'eend', 'fles', 'glas', 'haar', 'jurk', 'kast', 'lamp',
        
        # 5-6 character words (basic)
        'ablak', 'bors', 'cukor', 'dohany', 'egres', 'fagylalt', 'gitar', 'haz',
        'ido', 'jeg', 'kep', 'lab', 'mez', 'nap', 'or', 'pal', 'rak', 'sor',
        'taj', 'uj', 'var', 'zold', 'auto', 'boka', 'cipo', 'daru',
        
        # 5-6 character words (additional)
        'appel', 'beker', 'dakpan', 'eikels', 'flesje', 'gras', 'honing', 'jassen',
        'kastje', 'lampen', 'muziek', 'natuur', 'oogjes', 'pannen', 'raam', 'schoen',
        'tafel', 'uren', 'vriend', 'winkel', 'zomer', 'appel', 'beker', 'dakpan',
        
        # 7-8 character words (basic)
        'ablak', 'bors', 'cukor', 'dohany', 'egres', 'fagylalt', 'gitar', 'haz',
        'ido', 'jeg', 'kep', 'lab', 'mez', 'nap', 'or', 'pal', 'rak', 'sor',
        'taj', 'uj', 'var', 'zold', 'auto', 'boka', 'cipo', 'daru',
        
        # 7-8 character words (additional)
        'appetit', 'brillant', 'chanson', 'diamant', 'elephant', 'fleurir',
        'garden', 'harmonie', 'infini', 'journee', 'kilo', 'lampe', 'maison',
        'nature', 'ocean', 'paradis', 'qualite', 'reponse', 'soleil', 'table',
        'univers', 'voyage', 'zebre',
        
        # New words (3-4 characters)
        'agy', 'bor', 'cukor', 'dio', 'eg', 'fa', 'gitar', 'haz', 'ido', 'jeg',
        'kep', 'lab', 'mez', 'nap', 'or', 'pal', 'rak', 'sor', 'taj', 'uj',
        'var', 'zold', 'auto', 'boka', 'cipo', 'daru', 'eger', 'falu', 'golyo',
        
        # New words (5-6 characters)
        'ablak', 'bors', 'cukor', 'dohany', 'egres', 'fagylalt', 'gitar', 'haz',
        'ido', 'jeg', 'kep', 'lab', 'mez', 'nap', 'or', 'pal', 'rak', 'sor',
        'taj', 'uj', 'var', 'zold', 'auto', 'boka', 'cipo', 'daru',
        
        # New words (7-8 characters)
        'ablak', 'bors', 'cukor', 'dohany', 'egres', 'fagylalt', 'gitar', 'haz',
        'ido', 'jeg', 'kep', 'lab', 'mez', 'nap', 'or', 'pal', 'rak', 'sor',
        'taj', 'uj', 'var', 'zold', 'auto', 'boka', 'cipo', 'daru',
        # Add words with 10+ characters
        'eper', 'görögdinnye', 'dinnye', 'áfonya',
        'málna', 'szeder', 'ribizli', 'bodza',
        'egres', 'áfonya', 'eper', 'görögdinnye',
        'ananász', 'gránátalma', 'rebarbara', 'eper',
        'mandarin', 'görögdinnye', 'cukkini', 'eper',
        'görögdinnye', 'dinnye', 'áfonya', 'málna',
        'szeder', 'ribizli', 'bodza', 'egres',
        'áfonya', 'eper', 'görögdinnye', 'ananász',
        'gránátalma', 'rebarbara', 'eper', 'mandarin',
        'görögdinnye', 'cukkini', 'eper', 'görögdinnye'
    ] if word.lower() not in NLTK_WORDS
]

# Swahili word list (only non-overlapping with NLTK words)
SWAHILI_WORDS = [
    word for word in [
        # 3-4 character words (basic)
        'ana', 'baba', 'chai', 'dada', 'embe', 'fura', 'gari', 'hali', 'jina', 'kazi',
        'lala', 'mama', 'nani', 'paka', 'rafiki', 'sana', 'tatu', 'uma', 'vita', 'wapi',
        'yeye', 'zuri', 'akili', 'bahari', 'chakula', 'dawa', 'elimu', 'furaha',
        
        # 3-4 character words (additional)
        'bak', 'dak', 'eik', 'gat', 'hut', 'ijs', 'kas', 'lot', 'mat', 'net',
        'oog', 'pad', 'rok', 'sok', 'tak', 'uur', 'vat', 'wip', 'zak', 'zon',
        'aap', 'bal', 'dier', 'eend', 'fles', 'glas', 'haar', 'jurk', 'kast', 'lamp',
        
        # 5-6 character words (basic)
        'asante', 'bahari', 'chakula', 'dawa', 'elimu', 'furaha', 'gari', 'hali',
        'jina', 'kazi', 'lala', 'mama', 'nani', 'paka', 'rafiki', 'sana', 'tatu',
        'uma', 'vita', 'wapi', 'yeye', 'zuri', 'akili', 'bahari', 'chakula',
        
        # 5-6 character words (additional)
        'appel', 'beker', 'dakpan', 'eikels', 'flesje', 'gras', 'honing', 'jassen',
        'kastje', 'lampen', 'muziek', 'natuur', 'oogjes', 'pannen', 'raam', 'schoen',
        'tafel', 'uren', 'vriend', 'winkel', 'zomer', 'appel', 'beker', 'dakpan',
        
        # 7-8 character words (basic)
        'asante', 'bahari', 'chakula', 'dawa', 'elimu', 'furaha', 'gari', 'hali',
        'jina', 'kazi', 'lala', 'mama', 'nani', 'paka', 'rafiki', 'sana', 'tatu',
        'uma', 'vita', 'wapi', 'yeye', 'zuri', 'akili', 'bahari', 'chakula',
        
        # 7-8 character words (additional)
        'appetit', 'brillant', 'chanson', 'diamant', 'elephant', 'fleurir',
        'garden', 'harmonie', 'infini', 'journee', 'kilo', 'lampe', 'maison',
        'nature', 'ocean', 'paradis', 'qualite', 'reponse', 'soleil', 'table',
        'univers', 'voyage', 'zebre',
        
        # New words (3-4 characters)
        'ana', 'baba', 'chai', 'dada', 'embe', 'fura', 'gari', 'hali', 'jina', 'kazi',
        'lala', 'mama', 'nani', 'paka', 'rafiki', 'sana', 'tatu', 'uma', 'vita', 'wapi',
        'yeye', 'zuri', 'akili', 'bahari', 'chakula', 'dawa', 'elimu', 'furaha',
        
        # New words (5-6 characters)
        'asante', 'bahari', 'chakula', 'dawa', 'elimu', 'furaha', 'gari', 'hali',
        'jina', 'kazi', 'lala', 'mama', 'nani', 'paka', 'rafiki', 'sana', 'tatu',
        'uma', 'vita', 'wapi', 'yeye', 'zuri', 'akili', 'bahari', 'chakula',
        
        # New words (7-8 characters)
        'asante', 'bahari', 'chakula', 'dawa', 'elimu', 'furaha', 'gari', 'hali',
        'jina', 'kazi', 'lala', 'mama', 'nani', 'paka', 'rafiki', 'sana', 'tatu',
        'uma', 'vita', 'wapi', 'yeye', 'zuri', 'akili', 'bahari', 'chakula',
        # Add words with 10+ characters
        'nanasi', 'komamanga', 'rabarba', 'strawberi',
        'mandarini', 'majani ya mboga', 'strawberi', 'tikiti maji',
        'bluberi', 'rasiberi', 'blackberi', 'mzabibu',
        'goziberi', 'strawberi', 'tikiti maji', 'nanasi',
        'komamanga', 'rabarba', 'strawberi', 'mandarini',
        'tikiti maji', 'majani ya mboga', 'strawberi', 'tikiti maji'
    ] if word.lower() not in NLTK_WORDS
]

# Romanized Japanese word list (only non-overlapping with NLTK words)
JAPANESE_WORDS = [
    word for word in [
        # 3-4 character words (basic)
        'ai', 'boku', 'chi', 'da', 'e', 'fu', 'ga', 'ha', 'i', 'ji',
        'ka', 'la', 'ma', 'na', 'o', 'pa', 'ra', 'sa', 'ta', 'u',
        'wa', 'ya', 'zo', 'aki', 'bara', 'chai', 'dai', 'eigo', 'fuji',
        
        # 3-4 character words (additional)
        'ame', 'bara', 'cha', 'dai', 'eiga', 'fuji', 'gaku', 'hana', 'ichi', 'jikan',
        'kami', 'luna', 'mizu', 'nami', 'otoko', 'panda', 'ringo', 'sakura', 'taiyo',
        'umi', 'washi', 'yama', 'zutto', 'akane', 'bara', 'chai', 'dai', 'eigo',
        
        # 5-6 character words (basic)
        'akane', 'bara', 'chai', 'dai', 'eigo', 'fuji', 'gaku', 'hashi',
        'ichi', 'jikan', 'kaze', 'luna', 'machi', 'natsu', 'otoko', 'panda',
        'ringo', 'sakura', 'taiyo', 'umi', 'washi', 'yama', 'zutto',
        
        # 5-6 character words (additional)
        'akane', 'bara', 'chai', 'dai', 'eigo', 'fuji', 'gaku', 'hashi',
        'ichi', 'jikan', 'kaze', 'luna', 'machi', 'natsu', 'otoko', 'panda',
        'ringo', 'sakura', 'taiyo', 'umi', 'washi', 'yama', 'zutto',
        
        # 7-8 character words (basic)
        'akane', 'bara', 'chai', 'dai', 'eigo', 'fuji', 'gaku', 'hashi',
        'ichi', 'jikan', 'kaze', 'luna', 'machi', 'natsu', 'otoko', 'panda',
        'ringo', 'sakura', 'taiyo', 'umi', 'washi', 'yama', 'zutto',
        
        # 7-8 character words (additional)
        'akane', 'bara', 'chai', 'dai', 'eigo', 'fuji', 'gaku', 'hashi',
        'ichi', 'jikan', 'kaze', 'luna', 'machi', 'natsu', 'otoko', 'panda',
        'ringo', 'sakura', 'taiyo', 'umi', 'washi', 'yama', 'zutto',
        
        # New words (3-4 characters)
        'ai', 'boku', 'chi', 'da', 'e', 'fu', 'ga', 'ha', 'i', 'ji',
        'ka', 'la', 'ma', 'na', 'o', 'pa', 'ra', 'sa', 'ta', 'u',
        'wa', 'ya', 'zo', 'aki', 'bara', 'chai', 'dai', 'eigo', 'fuji',
        
        # New words (5-6 characters)
        'akane', 'bara', 'chai', 'dai', 'eigo', 'fuji', 'gaku', 'hashi',
        'ichi', 'jikan', 'kaze', 'luna', 'machi', 'natsu', 'otoko', 'panda',
        'ringo', 'sakura', 'taiyo', 'umi', 'washi', 'yama', 'zutto',
        
        # New words (7-8 characters)
        'akane', 'bara', 'chai', 'dai', 'eigo', 'fuji', 'gaku', 'hashi',
        'ichi', 'jikan', 'kaze', 'luna', 'machi', 'natsu', 'otoko', 'panda',
        'ringo', 'sakura', 'taiyo', 'umi', 'washi', 'yama', 'zutto',
        # Add words with 10+ characters
        'ichigo', 'suika', 'meron', 'aoichigo',
        'ichigo', 'kuroichigo', 'kurantsuberi', 'niwatoko',
        'guzuberi', 'aoichigo', 'ichigo', 'suika',
        'painappuru', 'zakuro', 'ruibarubu', 'ichigo',
        'mikan', 'suika', 'zukkini', 'ichigo',
        'suika', 'meron', 'aoichigo', 'ichigo',
        'kuroichigo', 'kurantsuberi', 'niwatoko', 'guzuberi',
        'aoichigo', 'ichigo', 'suika', 'painappuru',
        'zakuro', 'ruibarubu', 'ichigo', 'mikan',
        'suika', 'zukkini', 'ichigo', 'suika'
    ] if word.lower() not in NLTK_WORDS
]

# TLD list
TLDS = [
    # Common TLDs
    '.com', '.net', '.org', '.io', '.co', '.jp', '.uk', '.de', '.fr', '.ru',
    '.info', '.biz', '.mobi', '.tv', '.me', '.cc', '.xyz', '.site',
]


# Numeric substitution neologism list
LEETSPEAK_WORDS = [
    word for word in [
        # Basic substitution patterns
        '4rt', 'b0x', 'c4t', 'd0g', '3gg', 'f0x', 'h4t', '1c3', 'j4m', 'k3y',
        'l0g', 'm4p', 'n3t', '01l', 'p3n', 'r4t', '5un', 't34', 'u53', 'v4n',
        'w3b', 'y35', 'z1p', '41r', 'bu5', 'cu7', 'd4y', '3y3', 'fly', 'g45',
        
        # Technical word substitutions
        '4p1', 'b3t4', 'c0d3', 'd4t4', '3ch0', 'f14sh', 'g4mm4', 'h05t',
        '1npu7', 'jump', 'k3rn3l', 'l0g1c', 'm47r1x', 'n0d3', '0u7pu7', 'pr0xy',
        'qu3ry', 'r0u73r', '53rv3r', '74rg37', 'upd473', 'v3c70r', 'w1nd0w',
        
        # Common word substitutions
        '4c3', 'b4d', 'c0w', 'dry', '3nd', 'f17', 'g4p', 'h17', 'j37', 'k17',
        'l0w', 'm1x', 'n3w', '0dd', 'p4y', 'r4w', '537', '7ry', 'u53', 'v14',
        'w4y', 'y35', 'z4p', '4c7', 'b1g', 'cu7', 'd1g', '347', 'f1x', 'g37',
        
        # Longer word substitutions
        '4ppl3', 'b34ch', 'cl0ud', 'dr34m', '34r7h', 'f13ld', 'gr33n', 'h0u53',
        '15l4nd', 'j3lly', 'kn1f3', 'l1gh7', 'mu51c', 'n1gh7', '0c34n', 'p4p3r',
        'qu33n', 'r1v3r', '57on3', '74bl3', 'umbr3ll4', 'v01c3', 'w473r',
        
        # Technical neologism substitutions
        '4dv4nc3d', 'br0w53r', 'c0mpu73r', 'd474b453', '3ncryp7', 'f1r3w4ll',
        'g473w4y', 'h4rdw4r3', '1n73rn37', 'jun7ion', 'k3yb04rd', 'l4ngu4g3',
        'm0n17or', 'n37w0rk', '0p3r470r', 'pr070col', 'qu4n7um', 'r34l71m3'
    ] if word.lower() not in NLTK_WORDS
]

def corrupt_word(word):
    if not word: return word
    idx = random.randint(0, len(word) - 1)
    replacement = random.choice([c for c in string.ascii_lowercase if c != word[idx].lower()])
    return word[:idx] + replacement + word[idx+1:]

# Incorrect word list (words with one character different from ENGLISH_WORDS)
MISSPELLED_WORDS = [
    corrupt_word(word) for word in ENGLISH_WORDS
    if corrupt_word(word).lower() not in NLTK_WORDS
]

# print(len(ENGLISH_WORDS))
# print(len(GERMAN_WORDS))
# print(len(POLISH_WORDS))
# print(len(HUNGARIAN_WORDS))
# print(len(SWAHILI_WORDS))
# print(len(JAPANESE_WORDS))
# print(len(DUTCH_WORDS))
# print(len(FRENCH_WORDS))
# print(len(CONSONANT_WORDS))
# print(len(LEETSPEAK_WORDS))
# print(len(MISSPELLED_WORDS))
# print(len(SHUFFLED_ENGLISH_WORDS))

print(SHUFFLED_ENGLISH_WORDS)