See мужик in All languages combined, or Wiktionary
{ "derived": [ { "_dis1": "0 0 0 0 0 0 0", "roman": "mužíčka", "word": "мужи́чка" }, { "_dis1": "0 0 0 0 0 0 0", "roman": "mužičʹjó", "word": "мужичьё" } ], "descendants": [ { "depth": 1, "templates": [ { "args": { "1": "hy", "2": "մուժիկ", "bor": "1" }, "expansion": "→ Armenian: մուժիկ (mužik)", "name": "desc" } ], "text": "→ Armenian: մուժիկ (mužik)" }, { "depth": 1, "templates": [ { "args": { "1": "az", "2": "mujik", "bor": "1" }, "expansion": "→ Azerbaijani: mujik", "name": "desc" } ], "text": "→ Azerbaijani: mujik" }, { "depth": 1, "templates": [ { "args": { "1": "fa", "2": "موژیک", "bor": "1", "tr": "mužik" }, "expansion": "→ Persian: موژیک (mužik)", "name": "desc" } ], "text": "→ Persian: موژیک (mužik)" }, { "depth": 1, "templates": [ { "args": { "1": "en", "2": "mujik", "3": "muzhik", "bor": "1" }, "expansion": "→ English: mujik, muzhik", "name": "desc" } ], "text": "→ English: mujik, muzhik" }, { "depth": 1, "templates": [ { "args": { "1": "fr", "2": "moujik", "bor": "1" }, "expansion": "→ French: moujik", "name": "desc" } ], "text": "→ French: moujik" }, { "depth": 1, "templates": [ { "args": { "1": "ka", "2": "მუჯიკი", "bor": "1" }, "expansion": "→ Georgian: მუჯიკი (muǯiḳi)", "name": "desc" } ], "text": "→ Georgian: მუჯიკი (muǯiḳi)" }, { "depth": 1, "templates": [ { "args": { "1": "de", "2": "Muschik", "3": "Mushik", "bor": "1" }, "expansion": "→ German: Muschik, Mushik", "name": "desc" } ], "text": "→ German: Muschik, Mushik" }, { "depth": 1, "templates": [ { "args": { "1": "pl", "2": "mużyk", "bor": "1" }, "expansion": "→ Polish: mużyk", "name": "desc" } ], "text": "→ Polish: mużyk" }, { "depth": 1, "templates": [ { "args": { "1": "uby", "2": "мыжыӄ", "bor": "1" }, "expansion": "→ Ubykh: мыжыӄ (məẑəq)", "name": "desc" } ], "text": "→ Ubykh: мыжыӄ (məẑəq)" } ], "etymology_templates": [ { "args": { "1": "ru", "2": "муж", "3": "-ик", "t1": "man (dated); husband" }, "expansion": "муж (muž, “man (dated); husband”) + -ик (-ik)", "name": "af" } ], "etymology_text": "From муж (muž, “man (dated); husband”) + -ик (-ik).", "forms": [ { "form": "мужи́к", "tags": [ "canonical" ] }, { "form": "mužík", "tags": [ "romanization" ] }, { "form": "мужика́", "tags": [ "genitive" ] }, { "form": "мужики́", "tags": [ "nominative", "plural" ] }, { "form": "мужико́в", "tags": [ "genitive", "plural" ] }, { "form": "мужи́цкий", "tags": [ "adjective", "relational" ] }, { "form": "мужи́чий", "tags": [ "adjective", "relational" ] }, { "form": "мужичо́к", "tags": [ "diminutive" ] }, { "form": "мужичи́ще", "tags": [ "augmentative" ] }, { "form": "мужичо́нка", "tags": [ "pejorative" ] }, { "form": "мужичи́шка", "tags": [ "pejorative" ] }, { "form": "no-table-tags", "source": "declension", "tags": [ "table-tags" ] }, { "form": "ru-noun-table", "source": "declension", "tags": [ "inflection-template" ] }, { "form": "velar-stem", "source": "declension", "tags": [ "class" ] }, { "form": "accent-b", "source": "declension", "tags": [ "class" ] }, { "form": "мужи́к", "roman": "mužík", "source": "declension", "tags": [ "nominative", "singular" ] }, { "form": "мужики́", "roman": "mužikí", "source": "declension", "tags": [ "nominative", "plural" ] }, { "form": "мужика́", "roman": "mužiká", "source": "declension", "tags": [ "genitive", "singular" ] }, { "form": "мужико́в", "roman": "mužikóv", "source": "declension", "tags": [ "genitive", "plural" ] }, { "form": "мужику́", "roman": "mužikú", "source": "declension", "tags": [ "dative", "singular" ] }, { "form": "мужика́м", "roman": "mužikám", "source": "declension", "tags": [ "dative", "plural" ] }, { "form": "мужика́", "roman": "mužiká", "source": "declension", "tags": [ "accusative", "singular" ] }, { "form": "мужико́в", "roman": "mužikóv", "source": "declension", "tags": [ "accusative", "plural" ] }, { "form": "мужико́м", "roman": "mužikóm", "source": "declension", "tags": [ "instrumental", "singular" ] }, { "form": "мужика́ми", "roman": "mužikámi", "source": "declension", "tags": [ "instrumental", "plural" ] }, { "form": "мужике́", "roman": "mužiké", "source": "declension", "tags": [ "prepositional", "singular" ] }, { "form": "мужика́х", "roman": "mužikáx", "source": "declension", "tags": [ "plural", "prepositional" ] } ], "head_templates": [ { "args": { "1": "b", "2": "мужи́к", "a": "an", "adj": "мужи́цкий", "adj2": "мужи́чий", "aug": "мужичи́ще", "dim": "мужичо́к", "pej": "мужичо́нка", "pej2": "мужичи́шка" }, "expansion": "мужи́к • (mužík) m anim (genitive мужика́, nominative plural мужики́, genitive plural мужико́в, relational adjective мужи́цкий or мужи́чий, diminutive мужичо́к, augmentative мужичи́ще, pejorative мужичо́нка or мужичи́шка)", "name": "ru-noun+" } ], "lang": "Russian", "lang_code": "ru", "pos": "noun", "senses": [ { "antonyms": [ { "word": "ба́ба" } ], "categories": [ { "_dis": "32 0 24 10 11 14 9", "kind": "topical", "langcode": "ru", "name": "Male people", "orig": "ru:Male people", "parents": [ "Male", "People", "Gender", "Human", "Biology", "Psychology", "Sociology", "All topics", "Sciences", "Social sciences", "Fundamental", "Society" ], "source": "w+disamb" } ], "glosses": [ "man (male person); (UK) bloke, (US) dude, fella, guy" ], "id": "en-мужик-ru-noun-tS1NJxte", "links": [ [ "colloquial", "colloquial#English" ], [ "man", "man" ], [ "bloke", "bloke" ], [ "dude", "dude" ], [ "fella", "fella" ], [ "guy", "guy" ] ], "qualifier": "low colloquial", "raw_glosses": [ "(low colloquial) man (male person); (UK) bloke, (US) dude, fella, guy" ], "synonyms": [ { "word": "мужчи́на" } ] }, { "categories": [], "glosses": [ "husband" ], "id": "en-мужик-ru-noun-n-6PiLk6", "links": [ [ "husband", "husband" ] ], "raw_glosses": [ "(colloquial) husband" ], "synonyms": [ { "word": "муж" }, { "word": "супру́г" } ], "tags": [ "colloquial" ] }, { "categories": [ { "_dis": "2 1 31 34 2 14 16", "kind": "other", "name": "Pages with 1 entry", "parents": [], "source": "w+disamb" }, { "_dis": "2 1 31 34 2 17 14", "kind": "other", "name": "Pages with entries", "parents": [], "source": "w+disamb" }, { "_dis": "3 0 28 32 6 16 14", "kind": "other", "name": "Russian entries with incorrect language header", "parents": [ "Entries with incorrect language header", "Entry maintenance" ], "source": "w+disamb" }, { "_dis": "4 1 23 27 8 21 17", "kind": "other", "name": "Russian links with redundant wikilinks", "parents": [ "Links with redundant wikilinks", "Entry maintenance" ], "source": "w+disamb" } ], "glosses": [ "a man as a bearer of masculine qualities; man, macho man, real man" ], "id": "en-мужик-ru-noun-RM5ivXbv", "links": [ [ "man", "man" ], [ "macho man", "macho man" ], [ "real", "real" ] ], "qualifier": "approving", "raw_glosses": [ "(colloquial, approving) a man as a bearer of masculine qualities; man, macho man, real man" ], "synonyms": [ { "word": "ма́чо" }, { "word": "мужла́н" } ], "tags": [ "colloquial" ] }, { "categories": [ { "_dis": "2 1 31 34 2 14 16", "kind": "other", "name": "Pages with 1 entry", "parents": [], "source": "w+disamb" }, { "_dis": "2 1 31 34 2 17 14", "kind": "other", "name": "Pages with entries", "parents": [], "source": "w+disamb" }, { "_dis": "3 0 28 32 6 16 14", "kind": "other", "name": "Russian entries with incorrect language header", "parents": [ "Entries with incorrect language header", "Entry maintenance" ], "source": "w+disamb" }, { "_dis": "4 1 23 27 8 21 17", "kind": "other", "name": "Russian links with redundant wikilinks", "parents": [ "Links with redundant wikilinks", "Entry maintenance" ], "source": "w+disamb" }, { "_dis": "13 10 13 26 10 10 19", "kind": "other", "name": "Russian nouns with accent pattern b", "parents": [], "source": "w+disamb" }, { "_dis": "1 1 18 48 3 16 12", "kind": "other", "name": "Russian terms of address", "parents": [ "Terms of address", "Terms by usage" ], "source": "w+disamb" }, { "_dis": "3 2 19 34 6 19 17", "kind": "other", "name": "Russian terms suffixed with -ик", "parents": [], "source": "w+disamb" } ], "examples": [ { "english": "Listen, men!", "roman": "Poslúšajte, mužikí!", "text": "Послу́шайте, мужики́!", "type": "example" } ], "glosses": [ "Term of address for men to each other" ], "id": "en-мужик-ru-noun-sCVOdvy-", "links": [ [ "Term of address", "term of address#English" ] ], "raw_glosses": [ "(colloquial) Term of address for men to each other" ], "tags": [ "colloquial" ] }, { "categories": [], "glosses": [ "coarse, uncouth man; boor" ], "id": "en-мужик-ru-noun-~FTFOH3R", "links": [ [ "vernacular", "vernacular#English" ], [ "coarse", "coarse" ], [ "uncouth", "uncouth" ], [ "boor", "boor" ] ], "qualifier": "rude", "raw_glosses": [ "(rude, archaic, vernacular) coarse, uncouth man; boor" ], "synonyms": [ { "word": "мужла́н" } ], "tags": [ "archaic", "vernacular" ] }, { "categories": [ { "_dis": "2 1 31 34 2 14 16", "kind": "other", "name": "Pages with 1 entry", "parents": [], "source": "w+disamb" }, { "_dis": "2 1 31 34 2 17 14", "kind": "other", "name": "Pages with entries", "parents": [], "source": "w+disamb" }, { "_dis": "3 0 28 32 6 16 14", "kind": "other", "name": "Russian entries with incorrect language header", "parents": [ "Entries with incorrect language header", "Entry maintenance" ], "source": "w+disamb" }, { "_dis": "4 1 23 27 8 21 17", "kind": "other", "name": "Russian links with redundant wikilinks", "parents": [ "Links with redundant wikilinks", "Entry maintenance" ], "source": "w+disamb" } ], "glosses": [ "commoner, peasant; mujik/muzhik" ], "id": "en-мужик-ru-noun-SL7WbNAY", "links": [ [ "commoner", "commoner" ], [ "peasant", "peasant" ], [ "mujik", "mujik" ], [ "muzhik", "muzhik" ] ], "qualifier": "Tsarist Russia", "raw_glosses": [ "(historical, Tsarist Russia) commoner, peasant; mujik/muzhik" ], "synonyms": [ { "word": "крестья́нин" }, { "word": "простолюди́н" } ], "tags": [ "historical" ] }, { "categories": [ { "kind": "topical", "langcode": "ru", "name": "Crime", "orig": "ru:Crime", "parents": [ "Criminal law", "Society", "Law", "All topics", "Justice", "Fundamental" ], "source": "w" }, { "_dis": "2 1 31 34 2 14 16", "kind": "other", "name": "Pages with 1 entry", "parents": [], "source": "w+disamb" }, { "_dis": "2 1 31 34 2 17 14", "kind": "other", "name": "Pages with entries", "parents": [], "source": "w+disamb" }, { "_dis": "3 0 28 32 6 16 14", "kind": "other", "name": "Russian entries with incorrect language header", "parents": [ "Entries with incorrect language header", "Entry maintenance" ], "source": "w+disamb" }, { "_dis": "4 1 23 27 8 21 17", "kind": "other", "name": "Russian links with redundant wikilinks", "parents": [ "Links with redundant wikilinks", "Entry maintenance" ], "source": "w+disamb" } ], "glosses": [ "ordinary convict working conscientiously in a prison camp" ], "id": "en-мужик-ru-noun-toNHVlCv", "links": [ [ "criminal", "criminal" ], [ "slang", "slang" ], [ "convict", "convict" ] ], "raw_glosses": [ "(criminal slang) ordinary convict working conscientiously in a prison camp" ], "tags": [ "slang" ] } ], "sounds": [ { "ipa": "[mʊˈʐɨk]" }, { "audio": "Ru-мужик.ogg", "mp3_url": "https://upload.wikimedia.org/wikipedia/commons/transcoded/2/23/Ru-%D0%BC%D1%83%D0%B6%D0%B8%D0%BA.ogg/Ru-%D0%BC%D1%83%D0%B6%D0%B8%D0%BA.ogg.mp3", "ogg_url": "https://upload.wikimedia.org/wikipedia/commons/2/23/Ru-%D0%BC%D1%83%D0%B6%D0%B8%D0%BA.ogg" } ], "synonyms": [ { "_dis1": "0 0 0 0 0 0 0", "roman": "mužík", "word": "мужи́къ — Pre-reform orthography (1918)" } ], "word": "мужик" }
{ "categories": [ "Pages with 1 entry", "Pages with entries", "Russian 2-syllable words", "Russian animate nouns", "Russian entries with incorrect language header", "Russian lemmas", "Russian links with redundant wikilinks", "Russian masculine nouns", "Russian nouns", "Russian nouns with accent pattern b", "Russian terms of address", "Russian terms suffixed with -ик", "Russian terms with IPA pronunciation", "Russian velar-stem masculine-form accent-b nouns", "Russian velar-stem masculine-form nouns", "ru:Male people" ], "derived": [ { "roman": "mužíčka", "word": "мужи́чка" }, { "roman": "mužičʹjó", "word": "мужичьё" } ], "descendants": [ { "depth": 1, "templates": [ { "args": { "1": "hy", "2": "մուժիկ", "bor": "1" }, "expansion": "→ Armenian: մուժիկ (mužik)", "name": "desc" } ], "text": "→ Armenian: մուժիկ (mužik)" }, { "depth": 1, "templates": [ { "args": { "1": "az", "2": "mujik", "bor": "1" }, "expansion": "→ Azerbaijani: mujik", "name": "desc" } ], "text": "→ Azerbaijani: mujik" }, { "depth": 1, "templates": [ { "args": { "1": "fa", "2": "موژیک", "bor": "1", "tr": "mužik" }, "expansion": "→ Persian: موژیک (mužik)", "name": "desc" } ], "text": "→ Persian: موژیک (mužik)" }, { "depth": 1, "templates": [ { "args": { "1": "en", "2": "mujik", "3": "muzhik", "bor": "1" }, "expansion": "→ English: mujik, muzhik", "name": "desc" } ], "text": "→ English: mujik, muzhik" }, { "depth": 1, "templates": [ { "args": { "1": "fr", "2": "moujik", "bor": "1" }, "expansion": "→ French: moujik", "name": "desc" } ], "text": "→ French: moujik" }, { "depth": 1, "templates": [ { "args": { "1": "ka", "2": "მუჯიკი", "bor": "1" }, "expansion": "→ Georgian: მუჯიკი (muǯiḳi)", "name": "desc" } ], "text": "→ Georgian: მუჯიკი (muǯiḳi)" }, { "depth": 1, "templates": [ { "args": { "1": "de", "2": "Muschik", "3": "Mushik", "bor": "1" }, "expansion": "→ German: Muschik, Mushik", "name": "desc" } ], "text": "→ German: Muschik, Mushik" }, { "depth": 1, "templates": [ { "args": { "1": "pl", "2": "mużyk", "bor": "1" }, "expansion": "→ Polish: mużyk", "name": "desc" } ], "text": "→ Polish: mużyk" }, { "depth": 1, "templates": [ { "args": { "1": "uby", "2": "мыжыӄ", "bor": "1" }, "expansion": "→ Ubykh: мыжыӄ (məẑəq)", "name": "desc" } ], "text": "→ Ubykh: мыжыӄ (məẑəq)" } ], "etymology_templates": [ { "args": { "1": "ru", "2": "муж", "3": "-ик", "t1": "man (dated); husband" }, "expansion": "муж (muž, “man (dated); husband”) + -ик (-ik)", "name": "af" } ], "etymology_text": "From муж (muž, “man (dated); husband”) + -ик (-ik).", "forms": [ { "form": "мужи́к", "tags": [ "canonical" ] }, { "form": "mužík", "tags": [ "romanization" ] }, { "form": "мужика́", "tags": [ "genitive" ] }, { "form": "мужики́", "tags": [ "nominative", "plural" ] }, { "form": "мужико́в", "tags": [ "genitive", "plural" ] }, { "form": "мужи́цкий", "tags": [ "adjective", "relational" ] }, { "form": "мужи́чий", "tags": [ "adjective", "relational" ] }, { "form": "мужичо́к", "tags": [ "diminutive" ] }, { "form": "мужичи́ще", "tags": [ "augmentative" ] }, { "form": "мужичо́нка", "tags": [ "pejorative" ] }, { "form": "мужичи́шка", "tags": [ "pejorative" ] }, { "form": "no-table-tags", "source": "declension", "tags": [ "table-tags" ] }, { "form": "ru-noun-table", "source": "declension", "tags": [ "inflection-template" ] }, { "form": "velar-stem", "source": "declension", "tags": [ "class" ] }, { "form": "accent-b", "source": "declension", "tags": [ "class" ] }, { "form": "мужи́к", "roman": "mužík", "source": "declension", "tags": [ "nominative", "singular" ] }, { "form": "мужики́", "roman": "mužikí", "source": "declension", "tags": [ "nominative", "plural" ] }, { "form": "мужика́", "roman": "mužiká", "source": "declension", "tags": [ "genitive", "singular" ] }, { "form": "мужико́в", "roman": "mužikóv", "source": "declension", "tags": [ "genitive", "plural" ] }, { "form": "мужику́", "roman": "mužikú", "source": "declension", "tags": [ "dative", "singular" ] }, { "form": "мужика́м", "roman": "mužikám", "source": "declension", "tags": [ "dative", "plural" ] }, { "form": "мужика́", "roman": "mužiká", "source": "declension", "tags": [ "accusative", "singular" ] }, { "form": "мужико́в", "roman": "mužikóv", "source": "declension", "tags": [ "accusative", "plural" ] }, { "form": "мужико́м", "roman": "mužikóm", "source": "declension", "tags": [ "instrumental", "singular" ] }, { "form": "мужика́ми", "roman": "mužikámi", "source": "declension", "tags": [ "instrumental", "plural" ] }, { "form": "мужике́", "roman": "mužiké", "source": "declension", "tags": [ "prepositional", "singular" ] }, { "form": "мужика́х", "roman": "mužikáx", "source": "declension", "tags": [ "plural", "prepositional" ] } ], "head_templates": [ { "args": { "1": "b", "2": "мужи́к", "a": "an", "adj": "мужи́цкий", "adj2": "мужи́чий", "aug": "мужичи́ще", "dim": "мужичо́к", "pej": "мужичо́нка", "pej2": "мужичи́шка" }, "expansion": "мужи́к • (mužík) m anim (genitive мужика́, nominative plural мужики́, genitive plural мужико́в, relational adjective мужи́цкий or мужи́чий, diminutive мужичо́к, augmentative мужичи́ще, pejorative мужичо́нка or мужичи́шка)", "name": "ru-noun+" } ], "lang": "Russian", "lang_code": "ru", "pos": "noun", "senses": [ { "antonyms": [ { "word": "ба́ба" } ], "glosses": [ "man (male person); (UK) bloke, (US) dude, fella, guy" ], "links": [ [ "colloquial", "colloquial#English" ], [ "man", "man" ], [ "bloke", "bloke" ], [ "dude", "dude" ], [ "fella", "fella" ], [ "guy", "guy" ] ], "qualifier": "low colloquial", "raw_glosses": [ "(low colloquial) man (male person); (UK) bloke, (US) dude, fella, guy" ], "synonyms": [ { "word": "мужчи́на" } ] }, { "categories": [ "Russian colloquialisms" ], "glosses": [ "husband" ], "links": [ [ "husband", "husband" ] ], "raw_glosses": [ "(colloquial) husband" ], "synonyms": [ { "word": "муж" }, { "word": "супру́г" } ], "tags": [ "colloquial" ] }, { "categories": [ "Russian colloquialisms" ], "glosses": [ "a man as a bearer of masculine qualities; man, macho man, real man" ], "links": [ [ "man", "man" ], [ "macho man", "macho man" ], [ "real", "real" ] ], "qualifier": "approving", "raw_glosses": [ "(colloquial, approving) a man as a bearer of masculine qualities; man, macho man, real man" ], "synonyms": [ { "word": "ма́чо" }, { "word": "мужла́н" } ], "tags": [ "colloquial" ] }, { "categories": [ "Russian colloquialisms", "Russian terms with usage examples" ], "examples": [ { "english": "Listen, men!", "roman": "Poslúšajte, mužikí!", "text": "Послу́шайте, мужики́!", "type": "example" } ], "glosses": [ "Term of address for men to each other" ], "links": [ [ "Term of address", "term of address#English" ] ], "raw_glosses": [ "(colloquial) Term of address for men to each other" ], "tags": [ "colloquial" ] }, { "categories": [ "Russian terms with archaic senses" ], "glosses": [ "coarse, uncouth man; boor" ], "links": [ [ "vernacular", "vernacular#English" ], [ "coarse", "coarse" ], [ "uncouth", "uncouth" ], [ "boor", "boor" ] ], "qualifier": "rude", "raw_glosses": [ "(rude, archaic, vernacular) coarse, uncouth man; boor" ], "synonyms": [ { "word": "мужла́н" } ], "tags": [ "archaic", "vernacular" ] }, { "categories": [ "Russian terms with historical senses" ], "glosses": [ "commoner, peasant; mujik/muzhik" ], "links": [ [ "commoner", "commoner" ], [ "peasant", "peasant" ], [ "mujik", "mujik" ], [ "muzhik", "muzhik" ] ], "qualifier": "Tsarist Russia", "raw_glosses": [ "(historical, Tsarist Russia) commoner, peasant; mujik/muzhik" ], "synonyms": [ { "word": "крестья́нин" }, { "word": "простолюди́н" } ], "tags": [ "historical" ] }, { "categories": [ "Russian criminal slang", "ru:Crime" ], "glosses": [ "ordinary convict working conscientiously in a prison camp" ], "links": [ [ "criminal", "criminal" ], [ "slang", "slang" ], [ "convict", "convict" ] ], "raw_glosses": [ "(criminal slang) ordinary convict working conscientiously in a prison camp" ], "tags": [ "slang" ] } ], "sounds": [ { "ipa": "[mʊˈʐɨk]" }, { "audio": "Ru-мужик.ogg", "mp3_url": "https://upload.wikimedia.org/wikipedia/commons/transcoded/2/23/Ru-%D0%BC%D1%83%D0%B6%D0%B8%D0%BA.ogg/Ru-%D0%BC%D1%83%D0%B6%D0%B8%D0%BA.ogg.mp3", "ogg_url": "https://upload.wikimedia.org/wikipedia/commons/2/23/Ru-%D0%BC%D1%83%D0%B6%D0%B8%D0%BA.ogg" } ], "synonyms": [ { "roman": "mužík", "word": "мужи́къ — Pre-reform orthography (1918)" } ], "word": "мужик" }
Download raw JSONL data for мужик meaning in Russian (8.4kB)
This page is a part of the kaikki.org machine-readable Russian dictionary. This dictionary is based on structured data extracted on 2024-11-06 from the enwiktionary dump dated 2024-10-02 using wiktextract (fbeafe8 and 7f03c9b). The data shown on this site has been post-processed and various details (e.g., extra categories) removed, some information disambiguated, and additional data merged from other sources. See the raw data download page for the unprocessed wiktextract data.
If you use this data in academic research, please cite Tatu Ylonen: Wiktextract: Wiktionary as Machine-Readable Structured Data, Proceedings of the 13th Conference on Language Resources and Evaluation (LREC), pp. 1317-1325, Marseille, 20-25 June 2022. Linking to the relevant page(s) under https://kaikki.org would also be greatly appreciated.