See sukun on Wiktionary
{ "etymology_templates": [ { "args": { "1": "en", "2": "ar", "3": "سُكُون" }, "expansion": "Borrowed from Arabic سُكُون (sukūn)", "name": "bor+" }, { "args": { "1": "en", "2": "ar", "3": "س ك ن" }, "expansion": "", "name": "root" } ], "etymology_text": "Borrowed from Arabic سُكُون (sukūn).", "forms": [ { "form": "sukuns", "tags": [ "plural" ] }, { "form": "sukkun", "tags": [ "alternative" ] }, { "form": "sukūn", "tags": [ "alternative" ] } ], "head_templates": [ { "args": {}, "expansion": "sukun (plural sukuns)", "name": "en-noun" } ], "lang": "English", "lang_code": "en", "pos": "noun", "senses": [ { "categories": [ { "kind": "other", "name": "English entries with incorrect language header", "parents": [ "Entries with incorrect language header", "Entry maintenance" ], "source": "w" }, { "kind": "other", "name": "Entries with translation boxes", "parents": [], "source": "w" }, { "kind": "other", "name": "Hindi terms with non-redundant manual transliterations", "parents": [ "Terms with non-redundant manual transliterations", "Entry maintenance" ], "source": "w" }, { "kind": "other", "name": "Pages with 6 entries", "parents": [], "source": "w" }, { "kind": "other", "name": "Pages with entries", "parents": [], "source": "w" }, { "kind": "other", "name": "Terms with Arabic translations", "parents": [], "source": "w" }, { "kind": "other", "name": "Terms with Azerbaijani translations", "parents": [], "source": "w" }, { "kind": "other", "name": "Terms with Central Kurdish translations", "parents": [], "source": "w" }, { "kind": "other", "name": "Terms with French translations", "parents": [], "source": "w" }, { "kind": "other", "name": "Terms with German translations", "parents": [], "source": "w" }, { "kind": "other", "name": "Terms with Hindi translations", "parents": [], "source": "w" }, { "kind": "other", "name": "Terms with Japanese translations", "parents": [], "source": "w" }, { "kind": "other", "name": "Terms with Kazakh translations", "parents": [], "source": "w" }, { "kind": "other", "name": "Terms with Korean translations", "parents": [], "source": "w" }, { "kind": "other", "name": "Terms with Malay translations", "parents": [], "source": "w" }, { "kind": "other", "name": "Terms with Mandarin translations", "parents": [], "source": "w" }, { "kind": "other", "name": "Terms with Northern Kurdish translations", "parents": [], "source": "w" }, { "kind": "other", "name": "Terms with Pashto translations", "parents": [], "source": "w" }, { "kind": "other", "name": "Terms with Persian translations", "parents": [], "source": "w" }, { "kind": "other", "name": "Terms with Russian translations", "parents": [], "source": "w" }, { "kind": "other", "name": "Terms with Tajik translations", "parents": [], "source": "w" }, { "kind": "other", "name": "Terms with Turkish translations", "parents": [], "source": "w" }, { "kind": "other", "name": "Terms with Urdu translations", "parents": [], "source": "w" }, { "kind": "other", "name": "Terms with Uzbek translations", "parents": [], "source": "w" }, { "kind": "other", "name": "Undetermined terms with redundant script codes", "parents": [ "Terms with redundant script codes", "Entry maintenance" ], "source": "w" }, { "kind": "topical", "langcode": "en", "name": "Arabic letter names", "orig": "en:Arabic letter names", "parents": [ "Letter names", "Letters, symbols, and punctuation", "Names", "Orthography", "All topics", "Proper nouns", "Terms by semantic function", "Writing", "Fundamental", "Nouns", "Human behaviour", "Language", "Lemmas", "Human", "Communication" ], "source": "w" }, { "kind": "topical", "langcode": "en", "name": "Diacritical marks", "orig": "en:Diacritical marks", "parents": [ "Letters, symbols, and punctuation", "Symbols", "Orthography", "Writing", "Human behaviour", "Language", "Human", "Communication", "All topics", "Fundamental" ], "source": "w" } ], "examples": [ { "text": "Near-synonyms: virama, halant" } ], "glosses": [ "A diacritic (ـْ) used in the Arabic abjad to mark the absence of a vowel." ], "id": "en-sukun-en-noun-WBXlKiT1", "links": [ [ "diacritic", "diacritic" ], [ "ـْ", "ـْ" ], [ "abjad", "abjad" ] ], "related": [ { "word": "damma" }, { "word": "ḍamma" }, { "word": "fatha" }, { "word": "fatḥa" }, { "word": "kasra" }, { "word": "shadda" }, { "word": "šadda" }, { "word": "tashkil" }, { "word": "taškīl" } ], "translations": [ { "code": "ar", "lang": "Arabic", "roman": "sukūn", "sense": "Diacritic used to mark the absence of a vowel", "tags": [ "masculine" ], "word": "سُكُون" }, { "code": "az", "lang": "Azerbaijani", "sense": "Diacritic used to mark the absence of a vowel", "word": "sukuun" }, { "code": "cmn", "lang": "Chinese Mandarin", "roman": "jìngfú", "sense": "Diacritic used to mark the absence of a vowel", "word": "靜符 /静符" }, { "code": "fr", "lang": "French", "sense": "Diacritic used to mark the absence of a vowel", "tags": [ "feminine", "masculine" ], "word": "soukoun" }, { "code": "de", "lang": "German", "sense": "Diacritic used to mark the absence of a vowel", "tags": [ "neuter" ], "word": "Sukun" }, { "code": "hi", "lang": "Hindi", "roman": "jazm", "sense": "Diacritic used to mark the absence of a vowel", "tags": [ "masculine" ], "word": "जज़्म" }, { "code": "ja", "lang": "Japanese", "roman": "sukūn", "sense": "Diacritic used to mark the absence of a vowel", "word": "スクーン" }, { "code": "kk", "lang": "Kazakh", "roman": "sukun", "sense": "Diacritic used to mark the absence of a vowel", "word": "сукун" }, { "code": "ko", "lang": "Korean", "roman": "sukun", "sense": "Diacritic used to mark the absence of a vowel", "word": "수쿤" }, { "code": "ckb", "lang": "Central Kurdish", "roman": "zene", "sense": "Diacritic used to mark the absence of a vowel", "word": "زەنە" }, { "code": "kmr", "lang": "Northern Kurdish", "sense": "Diacritic used to mark the absence of a vowel", "word": "sikûn" }, { "code": "ms", "lang": "Malay", "sense": "Diacritic used to mark the absence of a vowel", "word": "baris mati" }, { "code": "ms", "lang": "Malay", "sense": "Diacritic used to mark the absence of a vowel", "word": "tanda mati" }, { "code": "ms", "lang": "Malay", "sense": "Diacritic used to mark the absence of a vowel", "word": "sukun" }, { "code": "ps", "lang": "Pashto", "roman": "sokun", "sense": "Diacritic used to mark the absence of a vowel", "tags": [ "masculine" ], "word": "سکون" }, { "code": "fa-ira", "lang": "Iranian Persian", "roman": "jazm", "sense": "Diacritic used to mark the absence of a vowel", "word": "جَزْم" }, { "code": "fa-ira", "lang": "Iranian Persian", "roman": "sâken", "sense": "Diacritic used to mark the absence of a vowel", "word": "ساکِن" }, { "code": "fa-ira", "lang": "Iranian Persian", "roman": "sokun", "sense": "Diacritic used to mark the absence of a vowel", "word": "سُکون" }, { "code": "ru", "lang": "Russian", "roman": "sukún", "sense": "Diacritic used to mark the absence of a vowel", "tags": [ "masculine" ], "word": "суку́н" }, { "code": "tg", "lang": "Tajik", "roman": "sukun", "sense": "Diacritic used to mark the absence of a vowel", "word": "сукун" }, { "code": "tg", "lang": "Tajik", "roman": "jazm", "sense": "Diacritic used to mark the absence of a vowel", "word": "ҷазм" }, { "code": "tr", "lang": "Turkish", "sense": "Diacritic used to mark the absence of a vowel", "word": "sükûn" }, { "code": "tr", "lang": "Turkish", "sense": "Diacritic used to mark the absence of a vowel", "word": "cezm" }, { "code": "ur", "lang": "Urdu", "roman": "jazm", "sense": "Diacritic used to mark the absence of a vowel", "tags": [ "masculine" ], "word": "جَزْم" }, { "code": "uz", "lang": "Uzbek", "sense": "Diacritic used to mark the absence of a vowel", "word": "sukun" }, { "code": "uz", "lang": "Uzbek", "sense": "Diacritic used to mark the absence of a vowel", "word": "jazm" } ], "wikipedia": [ "Arabic diacritics#Sukūn" ] } ], "word": "sukun" } { "forms": [ { "form": "súkun", "tags": [ "canonical" ] } ], "head_templates": [ { "args": { "1": "aof", "2": "noun", "head": "súkun" }, "expansion": "súkun", "name": "head" } ], "lang": "Bragat", "lang_code": "aof", "pos": "noun", "senses": [ { "categories": [ { "kind": "other", "name": "Bragat entries with incorrect language header", "parents": [ "Entries with incorrect language header", "Entry maintenance" ], "source": "w" }, { "kind": "other", "name": "Pages with 6 entries", "parents": [], "source": "w" }, { "kind": "other", "name": "Pages with entries", "parents": [], "source": "w" } ], "glosses": [ "water" ], "id": "en-sukun-aof-noun-D0FoSQ44", "links": [ [ "water", "water" ] ] } ], "word": "sukun" } { "head_templates": [ { "args": { "1": "kxd", "2": "noun" }, "expansion": "sukun", "name": "head" } ], "lang": "Brunei Malay", "lang_code": "kxd", "pos": "noun", "senses": [ { "categories": [ { "kind": "other", "name": "Brunei Malay entries with incorrect language header", "parents": [ "Entries with incorrect language header", "Entry maintenance" ], "source": "w" }, { "kind": "other", "name": "Pages with 6 entries", "parents": [], "source": "w" }, { "kind": "other", "name": "Pages with entries", "parents": [], "source": "w" }, { "kind": "lifeform", "langcode": "kxd", "name": "Fruits", "orig": "kxd:Fruits", "parents": [ "Foods", "Plants", "Eating", "Food and drink", "Lifeforms", "Human behaviour", "All topics", "Life", "Human", "Fundamental", "Nature" ], "source": "w" } ], "glosses": [ "breadfruit, fruit of the tropical tree Artocarpus altilis" ], "id": "en-sukun-kxd-noun-fCpLVGzx", "links": [ [ "breadfruit", "breadfruit" ], [ "Artocarpus altilis", "Artocarpus altilis#Translingual" ] ] } ], "sounds": [ { "ipa": "/su.kun/" } ], "word": "sukun" } { "etymology_templates": [ { "args": { "1": "chk", "2": "en", "3": "school" }, "expansion": "English school", "name": "bor" } ], "etymology_text": "Borrowed from English school.", "head_templates": [ { "args": { "1": "chk", "2": "noun" }, "expansion": "sukun", "name": "head" } ], "lang": "Chuukese", "lang_code": "chk", "pos": "noun", "senses": [ { "categories": [ { "kind": "other", "name": "Chuukese entries with incorrect language header", "parents": [ "Entries with incorrect language header", "Entry maintenance" ], "source": "w" }, { "kind": "other", "name": "Pages with 6 entries", "parents": [], "source": "w" }, { "kind": "other", "name": "Pages with entries", "parents": [], "source": "w" } ], "glosses": [ "school" ], "id": "en-sukun-chk-noun-1k3r2ULX", "links": [ [ "school", "school" ] ] } ], "word": "sukun" } { "forms": [ { "form": "سوکون", "tags": [ "Jawi" ] }, { "form": "sukun-sukun", "tags": [ "plural" ] } ], "head_templates": [ { "args": { "j": "سوکون" }, "expansion": "sukun (Jawi spelling سوکون, plural sukun-sukun)", "name": "ms-noun" } ], "lang": "Malay", "lang_code": "ms", "pos": "noun", "senses": [ { "categories": [ { "kind": "other", "name": "Malay entries with incorrect language header", "parents": [ "Entries with incorrect language header", "Entry maintenance" ], "source": "w" }, { "kind": "other", "name": "Pages with 6 entries", "parents": [], "source": "w" }, { "kind": "other", "name": "Pages with entries", "parents": [], "source": "w" }, { "kind": "lifeform", "langcode": "ms", "name": "Fruits", "orig": "ms:Fruits", "parents": [ "Foods", "Plants", "Eating", "Food and drink", "Lifeforms", "Human behaviour", "All topics", "Life", "Human", "Fundamental", "Nature" ], "source": "w" } ], "glosses": [ "breadfruit, fruit of the tropical tree Artocarpus altilis" ], "id": "en-sukun-ms-noun-fCpLVGzx", "links": [ [ "breadfruit", "breadfruit" ], [ "Artocarpus altilis", "Artocarpus altilis#Translingual" ] ], "synonyms": [ { "word": "kulur" } ] } ], "sounds": [ { "ipa": "/sukon/", "tags": [ "Johor-Selangor" ] }, { "ipa": "/sukʊn/", "tags": [ "Riau-Lingga" ] }, { "rhymes": "-ukon" }, { "rhymes": "-kon" }, { "rhymes": "-on" } ], "word": "sukun" } { "head_templates": [ { "args": { "1": "szy", "2": "noun" }, "expansion": "sukun", "name": "head" } ], "lang": "Sakizaya", "lang_code": "szy", "pos": "noun", "senses": [ { "categories": [ { "kind": "other", "name": "Pages with 6 entries", "parents": [], "source": "w" }, { "kind": "other", "name": "Pages with entries", "parents": [], "source": "w" }, { "kind": "other", "name": "Sakizaya entries with incorrect language header", "parents": [ "Entries with incorrect language header", "Entry maintenance" ], "source": "w" } ], "glosses": [ "skirt" ], "id": "en-sukun-szy-noun-Orr85bxU", "links": [ [ "skirt", "skirt" ] ] } ], "sounds": [ { "ipa": "/su.ˈkun/" }, { "ipa": "[su.ˈkun]" } ], "word": "sukun" }
{ "forms": [ { "form": "súkun", "tags": [ "canonical" ] } ], "head_templates": [ { "args": { "1": "aof", "2": "noun", "head": "súkun" }, "expansion": "súkun", "name": "head" } ], "lang": "Bragat", "lang_code": "aof", "pos": "noun", "senses": [ { "categories": [ "Bragat entries with incorrect language header", "Bragat lemmas", "Bragat nouns", "Pages with 6 entries", "Pages with entries" ], "glosses": [ "water" ], "links": [ [ "water", "water" ] ] } ], "word": "sukun" } { "head_templates": [ { "args": { "1": "kxd", "2": "noun" }, "expansion": "sukun", "name": "head" } ], "lang": "Brunei Malay", "lang_code": "kxd", "pos": "noun", "senses": [ { "categories": [ "Brunei Malay entries with incorrect language header", "Brunei Malay lemmas", "Brunei Malay nouns", "Pages with 6 entries", "Pages with entries", "kxd:Fruits" ], "glosses": [ "breadfruit, fruit of the tropical tree Artocarpus altilis" ], "links": [ [ "breadfruit", "breadfruit" ], [ "Artocarpus altilis", "Artocarpus altilis#Translingual" ] ] } ], "sounds": [ { "ipa": "/su.kun/" } ], "word": "sukun" } { "etymology_templates": [ { "args": { "1": "chk", "2": "en", "3": "school" }, "expansion": "English school", "name": "bor" } ], "etymology_text": "Borrowed from English school.", "head_templates": [ { "args": { "1": "chk", "2": "noun" }, "expansion": "sukun", "name": "head" } ], "lang": "Chuukese", "lang_code": "chk", "pos": "noun", "senses": [ { "categories": [ "Chuukese entries with incorrect language header", "Chuukese lemmas", "Chuukese nouns", "Chuukese terms borrowed from English", "Chuukese terms derived from English", "Pages with 6 entries", "Pages with entries" ], "glosses": [ "school" ], "links": [ [ "school", "school" ] ] } ], "word": "sukun" } { "etymology_templates": [ { "args": { "1": "en", "2": "ar", "3": "سُكُون" }, "expansion": "Borrowed from Arabic سُكُون (sukūn)", "name": "bor+" }, { "args": { "1": "en", "2": "ar", "3": "س ك ن" }, "expansion": "", "name": "root" } ], "etymology_text": "Borrowed from Arabic سُكُون (sukūn).", "forms": [ { "form": "sukuns", "tags": [ "plural" ] }, { "form": "sukkun", "tags": [ "alternative" ] }, { "form": "sukūn", "tags": [ "alternative" ] } ], "head_templates": [ { "args": {}, "expansion": "sukun (plural sukuns)", "name": "en-noun" } ], "lang": "English", "lang_code": "en", "pos": "noun", "related": [ { "word": "damma" }, { "word": "ḍamma" }, { "word": "fatha" }, { "word": "fatḥa" }, { "word": "kasra" }, { "word": "shadda" }, { "word": "šadda" }, { "word": "tashkil" }, { "word": "taškīl" } ], "senses": [ { "categories": [ "English countable nouns", "English entries with incorrect language header", "English lemmas", "English nouns", "English terms borrowed from Arabic", "English terms derived from Arabic", "English terms derived from the Arabic root س ك ن", "Entries with translation boxes", "Hindi terms with non-redundant manual transliterations", "Pages with 6 entries", "Pages with entries", "Terms with Arabic translations", "Terms with Azerbaijani translations", "Terms with Central Kurdish translations", "Terms with French translations", "Terms with German translations", "Terms with Hindi translations", "Terms with Japanese translations", "Terms with Kazakh translations", "Terms with Korean translations", "Terms with Malay translations", "Terms with Mandarin translations", "Terms with Northern Kurdish translations", "Terms with Pashto translations", "Terms with Persian translations", "Terms with Russian translations", "Terms with Tajik translations", "Terms with Turkish translations", "Terms with Urdu translations", "Terms with Uzbek translations", "Undetermined terms with redundant script codes", "en:Arabic letter names", "en:Diacritical marks" ], "examples": [ { "text": "Near-synonyms: virama, halant" } ], "glosses": [ "A diacritic (ـْ) used in the Arabic abjad to mark the absence of a vowel." ], "links": [ [ "diacritic", "diacritic" ], [ "ـْ", "ـْ" ], [ "abjad", "abjad" ] ], "wikipedia": [ "Arabic diacritics#Sukūn" ] } ], "translations": [ { "code": "ar", "lang": "Arabic", "roman": "sukūn", "sense": "Diacritic used to mark the absence of a vowel", "tags": [ "masculine" ], "word": "سُكُون" }, { "code": "az", "lang": "Azerbaijani", "sense": "Diacritic used to mark the absence of a vowel", "word": "sukuun" }, { "code": "cmn", "lang": "Chinese Mandarin", "roman": "jìngfú", "sense": "Diacritic used to mark the absence of a vowel", "word": "靜符 /静符" }, { "code": "fr", "lang": "French", "sense": "Diacritic used to mark the absence of a vowel", "tags": [ "feminine", "masculine" ], "word": "soukoun" }, { "code": "de", "lang": "German", "sense": "Diacritic used to mark the absence of a vowel", "tags": [ "neuter" ], "word": "Sukun" }, { "code": "hi", "lang": "Hindi", "roman": "jazm", "sense": "Diacritic used to mark the absence of a vowel", "tags": [ "masculine" ], "word": "जज़्म" }, { "code": "ja", "lang": "Japanese", "roman": "sukūn", "sense": "Diacritic used to mark the absence of a vowel", "word": "スクーン" }, { "code": "kk", "lang": "Kazakh", "roman": "sukun", "sense": "Diacritic used to mark the absence of a vowel", "word": "сукун" }, { "code": "ko", "lang": "Korean", "roman": "sukun", "sense": "Diacritic used to mark the absence of a vowel", "word": "수쿤" }, { "code": "ckb", "lang": "Central Kurdish", "roman": "zene", "sense": "Diacritic used to mark the absence of a vowel", "word": "زەنە" }, { "code": "kmr", "lang": "Northern Kurdish", "sense": "Diacritic used to mark the absence of a vowel", "word": "sikûn" }, { "code": "ms", "lang": "Malay", "sense": "Diacritic used to mark the absence of a vowel", "word": "baris mati" }, { "code": "ms", "lang": "Malay", "sense": "Diacritic used to mark the absence of a vowel", "word": "tanda mati" }, { "code": "ms", "lang": "Malay", "sense": "Diacritic used to mark the absence of a vowel", "word": "sukun" }, { "code": "ps", "lang": "Pashto", "roman": "sokun", "sense": "Diacritic used to mark the absence of a vowel", "tags": [ "masculine" ], "word": "سکون" }, { "code": "fa-ira", "lang": "Iranian Persian", "roman": "jazm", "sense": "Diacritic used to mark the absence of a vowel", "word": "جَزْم" }, { "code": "fa-ira", "lang": "Iranian Persian", "roman": "sâken", "sense": "Diacritic used to mark the absence of a vowel", "word": "ساکِن" }, { "code": "fa-ira", "lang": "Iranian Persian", "roman": "sokun", "sense": "Diacritic used to mark the absence of a vowel", "word": "سُکون" }, { "code": "ru", "lang": "Russian", "roman": "sukún", "sense": "Diacritic used to mark the absence of a vowel", "tags": [ "masculine" ], "word": "суку́н" }, { "code": "tg", "lang": "Tajik", "roman": "sukun", "sense": "Diacritic used to mark the absence of a vowel", "word": "сукун" }, { "code": "tg", "lang": "Tajik", "roman": "jazm", "sense": "Diacritic used to mark the absence of a vowel", "word": "ҷазм" }, { "code": "tr", "lang": "Turkish", "sense": "Diacritic used to mark the absence of a vowel", "word": "sükûn" }, { "code": "tr", "lang": "Turkish", "sense": "Diacritic used to mark the absence of a vowel", "word": "cezm" }, { "code": "ur", "lang": "Urdu", "roman": "jazm", "sense": "Diacritic used to mark the absence of a vowel", "tags": [ "masculine" ], "word": "جَزْم" }, { "code": "uz", "lang": "Uzbek", "sense": "Diacritic used to mark the absence of a vowel", "word": "sukun" }, { "code": "uz", "lang": "Uzbek", "sense": "Diacritic used to mark the absence of a vowel", "word": "jazm" } ], "word": "sukun" } { "forms": [ { "form": "سوکون", "tags": [ "Jawi" ] }, { "form": "sukun-sukun", "tags": [ "plural" ] } ], "head_templates": [ { "args": { "j": "سوکون" }, "expansion": "sukun (Jawi spelling سوکون, plural sukun-sukun)", "name": "ms-noun" } ], "lang": "Malay", "lang_code": "ms", "pos": "noun", "senses": [ { "categories": [ "Malay entries with incorrect language header", "Malay lemmas", "Malay nouns", "Pages with 6 entries", "Pages with entries", "Rhymes:Malay/kon", "Rhymes:Malay/on", "Rhymes:Malay/ukon", "ms:Fruits" ], "glosses": [ "breadfruit, fruit of the tropical tree Artocarpus altilis" ], "links": [ [ "breadfruit", "breadfruit" ], [ "Artocarpus altilis", "Artocarpus altilis#Translingual" ] ], "synonyms": [ { "word": "kulur" } ] } ], "sounds": [ { "ipa": "/sukon/", "tags": [ "Johor-Selangor" ] }, { "ipa": "/sukʊn/", "tags": [ "Riau-Lingga" ] }, { "rhymes": "-ukon" }, { "rhymes": "-kon" }, { "rhymes": "-on" } ], "word": "sukun" } { "head_templates": [ { "args": { "1": "szy", "2": "noun" }, "expansion": "sukun", "name": "head" } ], "lang": "Sakizaya", "lang_code": "szy", "pos": "noun", "senses": [ { "categories": [ "Pages with 6 entries", "Pages with entries", "Sakizaya entries with incorrect language header", "Sakizaya lemmas", "Sakizaya nouns", "Sakizaya terms with IPA pronunciation" ], "glosses": [ "skirt" ], "links": [ [ "skirt", "skirt" ] ] } ], "sounds": [ { "ipa": "/su.ˈkun/" }, { "ipa": "[su.ˈkun]" } ], "word": "sukun" }
Download raw JSONL data for sukun meaning in All languages combined (8.6kB)
This page is a part of the kaikki.org machine-readable All languages combined dictionary. This dictionary is based on structured data extracted on 2025-03-23 from the enwiktionary dump dated 2025-03-21 using wiktextract (fef8596 and 633533e). The data shown on this site has been post-processed and various details (e.g., extra categories) removed, some information disambiguated, and additional data merged from other sources. See the raw data download page for the unprocessed wiktextract data.
If you use this data in academic research, please cite Tatu Ylonen: Wiktextract: Wiktionary as Machine-Readable Structured Data, Proceedings of the 13th Conference on Language Resources and Evaluation (LREC), pp. 1317-1325, Marseille, 20-25 June 2022. Linking to the relevant page(s) under https://kaikki.org would also be greatly appreciated.