See thứ in All languages combined, or Wiktionary
Download JSON data for thứ meaning in Vietnamese (8.4kB)
{ "etymology_number": 1, "etymology_templates": [ { "args": { "1": "vi", "2": "Sino-Vietnamese words" }, "expansion": "", "name": "categorize" }, { "args": { "1": "次" }, "expansion": "Sino-Vietnamese word from 次", "name": "vi-etym-sino" }, { "args": { "1": "km", "2": "ទី" }, "expansion": "Khmer ទី (tii)", "name": "ncog" }, { "args": { "1": "th", "2": "ที่" }, "expansion": "Thai ที่ (tîi)", "name": "ncog" }, { "args": { "1": "ja", "2": "第", "tr": "dai" }, "expansion": "Japanese 第 (dai)", "name": "ncog" }, { "args": { "1": "zh", "2": "-" }, "expansion": "Chinese", "name": "ncog" }, { "args": { "1": "第" }, "expansion": "第 (MC dejH)", "name": "ltc-l" } ], "etymology_text": "Sino-Vietnamese word from 次.\nNote that in spite of superficial similarity, this word is unrelated to Khmer ទី (tii), Thai ที่ (tîi), Japanese 第 (dai), all from Chinese 第 (MC dejH) (SV: đệ).", "head_templates": [ { "args": { "1": "vi", "2": "adjective", "3": "", "4": "", "5": "", "6": "", "head": "", "tr": "" }, "expansion": "thứ", "name": "head" }, { "args": {}, "expansion": "thứ", "name": "vi-adj" } ], "lang": "Vietnamese", "lang_code": "vi", "pos": "adj", "senses": [ { "categories": [ { "_dis": "34 34 7 0 25", "kind": "other", "name": "Sino-Vietnamese words", "parents": [], "source": "w+disamb" }, { "_dis": "42 50 8 0", "kind": "other", "name": "Vietnamese classifiers", "parents": [], "source": "w+disamb" } ], "glosses": [ "inferior in quality, second, second vice, under" ], "id": "en-thứ-vi-adj-zYqYIp59", "links": [ [ "inferior", "inferior" ], [ "quality", "quality" ], [ "second", "second" ], [ "vice", "vice" ], [ "under", "under" ] ] } ], "sounds": [ { "ipa": "[tʰɨ˧˦]", "tags": [ "Hà-Nội" ] }, { "ipa": "[tʰɨ˨˩˦]", "tags": [ "Huế" ] }, { "ipa": "[tʰɨ˦˥]", "tags": [ "Hồ-Chí-Minh-City" ] }, { "audio": "LL-Q9199 (vie)-Penn Zero MSSJ-thứ.wav", "mp3_url": "https://upload.wikimedia.org/wikipedia/commons/transcoded/3/3d/LL-Q9199_%28vie%29-Penn_Zero_MSSJ-th%E1%BB%A9.wav/LL-Q9199_%28vie%29-Penn_Zero_MSSJ-th%E1%BB%A9.wav.mp3", "ogg_url": "https://upload.wikimedia.org/wikipedia/commons/transcoded/3/3d/LL-Q9199_%28vie%29-Penn_Zero_MSSJ-th%E1%BB%A9.wav/LL-Q9199_%28vie%29-Penn_Zero_MSSJ-th%E1%BB%A9.wav.ogg", "tags": [ "Hà-Nội" ], "text": "Audio (Hà Nội)" } ], "word": "thứ" } { "etymology_number": 1, "etymology_templates": [ { "args": { "1": "vi", "2": "Sino-Vietnamese words" }, "expansion": "", "name": "categorize" }, { "args": { "1": "次" }, "expansion": "Sino-Vietnamese word from 次", "name": "vi-etym-sino" }, { "args": { "1": "km", "2": "ទី" }, "expansion": "Khmer ទី (tii)", "name": "ncog" }, { "args": { "1": "th", "2": "ที่" }, "expansion": "Thai ที่ (tîi)", "name": "ncog" }, { "args": { "1": "ja", "2": "第", "tr": "dai" }, "expansion": "Japanese 第 (dai)", "name": "ncog" }, { "args": { "1": "zh", "2": "-" }, "expansion": "Chinese", "name": "ncog" }, { "args": { "1": "第" }, "expansion": "第 (MC dejH)", "name": "ltc-l" } ], "etymology_text": "Sino-Vietnamese word from 次.\nNote that in spite of superficial similarity, this word is unrelated to Khmer ទី (tii), Thai ที่ (tîi), Japanese 第 (dai), all from Chinese 第 (MC dejH) (SV: đệ).", "head_templates": [ { "args": { "1": "vi", "2": "noun", "3": "", "4": "", "head": "", "tr": "" }, "expansion": "thứ", "name": "head" }, { "args": {}, "expansion": "thứ", "name": "vi-noun" } ], "lang": "Vietnamese", "lang_code": "vi", "pos": "noun", "senses": [ { "glosses": [ "order, rank, sort, type, kind, category" ], "id": "en-thứ-vi-noun-r1GN8ouq", "links": [ [ "order", "order" ], [ "rank", "rank" ], [ "sort", "sort" ], [ "type", "type" ], [ "kind", "kind" ], [ "category", "category" ] ] }, { "glosses": [ "thing" ], "id": "en-thứ-vi-noun-XelNaRrj", "links": [ [ "thing", "thing" ] ] } ], "sounds": [ { "ipa": "[tʰɨ˧˦]", "tags": [ "Hà-Nội" ] }, { "ipa": "[tʰɨ˨˩˦]", "tags": [ "Huế" ] }, { "ipa": "[tʰɨ˦˥]", "tags": [ "Hồ-Chí-Minh-City" ] }, { "audio": "LL-Q9199 (vie)-Penn Zero MSSJ-thứ.wav", "mp3_url": "https://upload.wikimedia.org/wikipedia/commons/transcoded/3/3d/LL-Q9199_%28vie%29-Penn_Zero_MSSJ-th%E1%BB%A9.wav/LL-Q9199_%28vie%29-Penn_Zero_MSSJ-th%E1%BB%A9.wav.mp3", "ogg_url": "https://upload.wikimedia.org/wikipedia/commons/transcoded/3/3d/LL-Q9199_%28vie%29-Penn_Zero_MSSJ-th%E1%BB%A9.wav/LL-Q9199_%28vie%29-Penn_Zero_MSSJ-th%E1%BB%A9.wav.ogg", "tags": [ "Hà-Nội" ], "text": "Audio (Hà Nội)" } ], "word": "thứ" } { "etymology_number": 1, "etymology_templates": [ { "args": { "1": "vi", "2": "Sino-Vietnamese words" }, "expansion": "", "name": "categorize" }, { "args": { "1": "次" }, "expansion": "Sino-Vietnamese word from 次", "name": "vi-etym-sino" }, { "args": { "1": "km", "2": "ទី" }, "expansion": "Khmer ទី (tii)", "name": "ncog" }, { "args": { "1": "th", "2": "ที่" }, "expansion": "Thai ที่ (tîi)", "name": "ncog" }, { "args": { "1": "ja", "2": "第", "tr": "dai" }, "expansion": "Japanese 第 (dai)", "name": "ncog" }, { "args": { "1": "zh", "2": "-" }, "expansion": "Chinese", "name": "ncog" }, { "args": { "1": "第" }, "expansion": "第 (MC dejH)", "name": "ltc-l" } ], "etymology_text": "Sino-Vietnamese word from 次.\nNote that in spite of superficial similarity, this word is unrelated to Khmer ទី (tii), Thai ที่ (tîi), Japanese 第 (dai), all from Chinese 第 (MC dejH) (SV: đệ).", "head_templates": [ { "args": { "1": "vi", "2": "classifier", "head": "", "tr": "" }, "expansion": "thứ", "name": "head" }, { "args": {}, "expansion": "thứ", "name": "vi-cls" } ], "lang": "Vietnamese", "lang_code": "vi", "pos": "classifier", "senses": [ { "categories": [ { "_dis": "34 34 7 0 25", "kind": "other", "name": "Sino-Vietnamese words", "parents": [], "source": "w+disamb" }, { "_dis": "42 50 8 0", "kind": "other", "name": "Vietnamese classifiers", "parents": [], "source": "w+disamb" }, { "_dis": "23 69 2 0 6", "kind": "other", "name": "Vietnamese entries with incorrect language header", "parents": [ "Entries with incorrect language header", "Entry maintenance" ], "source": "w+disamb" }, { "_dis": "40 50 10 0", "kind": "other", "name": "Vietnamese nouns without classifiers", "parents": [], "source": "w+disamb" } ], "glosses": [ "Indicates things of the same category, such as languages (tiếng)" ], "id": "en-thứ-vi-classifier-0rRl0A5b", "links": [ [ "same", "same#English" ], [ "category", "category#English" ], [ "language", "language#English" ], [ "tiếng", "tiếng#Vietnamese" ] ] } ], "sounds": [ { "ipa": "[tʰɨ˧˦]", "tags": [ "Hà-Nội" ] }, { "ipa": "[tʰɨ˨˩˦]", "tags": [ "Huế" ] }, { "ipa": "[tʰɨ˦˥]", "tags": [ "Hồ-Chí-Minh-City" ] }, { "audio": "LL-Q9199 (vie)-Penn Zero MSSJ-thứ.wav", "mp3_url": "https://upload.wikimedia.org/wikipedia/commons/transcoded/3/3d/LL-Q9199_%28vie%29-Penn_Zero_MSSJ-th%E1%BB%A9.wav/LL-Q9199_%28vie%29-Penn_Zero_MSSJ-th%E1%BB%A9.wav.mp3", "ogg_url": "https://upload.wikimedia.org/wikipedia/commons/transcoded/3/3d/LL-Q9199_%28vie%29-Penn_Zero_MSSJ-th%E1%BB%A9.wav/LL-Q9199_%28vie%29-Penn_Zero_MSSJ-th%E1%BB%A9.wav.ogg", "tags": [ "Hà-Nội" ], "text": "Audio (Hà Nội)" } ], "word": "thứ" } { "etymology_number": 2, "etymology_templates": [ { "args": { "1": "vi", "2": "Sino-Vietnamese words" }, "expansion": "", "name": "categorize" }, { "args": { "1": "恕" }, "expansion": "Sino-Vietnamese word from 恕", "name": "vi-etym-sino" } ], "etymology_text": "Sino-Vietnamese word from 恕.", "head_templates": [ { "args": { "1": "vi", "2": "verb", "3": "", "4": "", "head": "", "tr": "" }, "expansion": "thứ", "name": "head" }, { "args": {}, "expansion": "thứ", "name": "vi-verb" } ], "lang": "Vietnamese", "lang_code": "vi", "pos": "verb", "senses": [ { "categories": [ { "_dis": "34 34 7 0 25", "kind": "other", "name": "Sino-Vietnamese words", "parents": [], "source": "w+disamb" } ], "glosses": [ "to pardon, to forgive" ], "id": "en-thứ-vi-verb-A4~qxycZ", "links": [ [ "pardon", "pardon" ], [ "forgive", "forgive" ] ], "raw_glosses": [ "(chiefly in compounds, literary) to pardon, to forgive" ], "related": [ { "word": "tha thứ" } ], "tags": [ "in-compounds", "literary" ] } ], "sounds": [ { "ipa": "[tʰɨ˧˦]", "tags": [ "Hà-Nội" ] }, { "ipa": "[tʰɨ˨˩˦]", "tags": [ "Huế" ] }, { "ipa": "[tʰɨ˦˥]", "tags": [ "Hồ-Chí-Minh-City" ] }, { "audio": "LL-Q9199 (vie)-Penn Zero MSSJ-thứ.wav", "mp3_url": "https://upload.wikimedia.org/wikipedia/commons/transcoded/3/3d/LL-Q9199_%28vie%29-Penn_Zero_MSSJ-th%E1%BB%A9.wav/LL-Q9199_%28vie%29-Penn_Zero_MSSJ-th%E1%BB%A9.wav.mp3", "ogg_url": "https://upload.wikimedia.org/wikipedia/commons/transcoded/3/3d/LL-Q9199_%28vie%29-Penn_Zero_MSSJ-th%E1%BB%A9.wav/LL-Q9199_%28vie%29-Penn_Zero_MSSJ-th%E1%BB%A9.wav.ogg", "tags": [ "Hà-Nội" ], "text": "Audio (Hà Nội)" } ], "word": "thứ" }
{ "categories": [ "Sino-Vietnamese words", "Vietnamese adjectives", "Vietnamese classifiers", "Vietnamese entries with incorrect language header", "Vietnamese lemmas", "Vietnamese nouns", "Vietnamese nouns without classifiers", "Vietnamese terms with IPA pronunciation", "Vietnamese terms with audio links", "Vietnamese verbs" ], "etymology_number": 1, "etymology_templates": [ { "args": { "1": "vi", "2": "Sino-Vietnamese words" }, "expansion": "", "name": "categorize" }, { "args": { "1": "次" }, "expansion": "Sino-Vietnamese word from 次", "name": "vi-etym-sino" }, { "args": { "1": "km", "2": "ទី" }, "expansion": "Khmer ទី (tii)", "name": "ncog" }, { "args": { "1": "th", "2": "ที่" }, "expansion": "Thai ที่ (tîi)", "name": "ncog" }, { "args": { "1": "ja", "2": "第", "tr": "dai" }, "expansion": "Japanese 第 (dai)", "name": "ncog" }, { "args": { "1": "zh", "2": "-" }, "expansion": "Chinese", "name": "ncog" }, { "args": { "1": "第" }, "expansion": "第 (MC dejH)", "name": "ltc-l" } ], "etymology_text": "Sino-Vietnamese word from 次.\nNote that in spite of superficial similarity, this word is unrelated to Khmer ទី (tii), Thai ที่ (tîi), Japanese 第 (dai), all from Chinese 第 (MC dejH) (SV: đệ).", "head_templates": [ { "args": { "1": "vi", "2": "adjective", "3": "", "4": "", "5": "", "6": "", "head": "", "tr": "" }, "expansion": "thứ", "name": "head" }, { "args": {}, "expansion": "thứ", "name": "vi-adj" } ], "lang": "Vietnamese", "lang_code": "vi", "pos": "adj", "senses": [ { "glosses": [ "inferior in quality, second, second vice, under" ], "links": [ [ "inferior", "inferior" ], [ "quality", "quality" ], [ "second", "second" ], [ "vice", "vice" ], [ "under", "under" ] ] } ], "sounds": [ { "ipa": "[tʰɨ˧˦]", "tags": [ "Hà-Nội" ] }, { "ipa": "[tʰɨ˨˩˦]", "tags": [ "Huế" ] }, { "ipa": "[tʰɨ˦˥]", "tags": [ "Hồ-Chí-Minh-City" ] }, { "audio": "LL-Q9199 (vie)-Penn Zero MSSJ-thứ.wav", "mp3_url": "https://upload.wikimedia.org/wikipedia/commons/transcoded/3/3d/LL-Q9199_%28vie%29-Penn_Zero_MSSJ-th%E1%BB%A9.wav/LL-Q9199_%28vie%29-Penn_Zero_MSSJ-th%E1%BB%A9.wav.mp3", "ogg_url": "https://upload.wikimedia.org/wikipedia/commons/transcoded/3/3d/LL-Q9199_%28vie%29-Penn_Zero_MSSJ-th%E1%BB%A9.wav/LL-Q9199_%28vie%29-Penn_Zero_MSSJ-th%E1%BB%A9.wav.ogg", "tags": [ "Hà-Nội" ], "text": "Audio (Hà Nội)" } ], "word": "thứ" } { "categories": [ "Sino-Vietnamese words", "Vietnamese adjectives", "Vietnamese classifiers", "Vietnamese entries with incorrect language header", "Vietnamese lemmas", "Vietnamese nouns", "Vietnamese nouns without classifiers", "Vietnamese terms with IPA pronunciation", "Vietnamese terms with audio links", "Vietnamese verbs" ], "etymology_number": 1, "etymology_templates": [ { "args": { "1": "vi", "2": "Sino-Vietnamese words" }, "expansion": "", "name": "categorize" }, { "args": { "1": "次" }, "expansion": "Sino-Vietnamese word from 次", "name": "vi-etym-sino" }, { "args": { "1": "km", "2": "ទី" }, "expansion": "Khmer ទី (tii)", "name": "ncog" }, { "args": { "1": "th", "2": "ที่" }, "expansion": "Thai ที่ (tîi)", "name": "ncog" }, { "args": { "1": "ja", "2": "第", "tr": "dai" }, "expansion": "Japanese 第 (dai)", "name": "ncog" }, { "args": { "1": "zh", "2": "-" }, "expansion": "Chinese", "name": "ncog" }, { "args": { "1": "第" }, "expansion": "第 (MC dejH)", "name": "ltc-l" } ], "etymology_text": "Sino-Vietnamese word from 次.\nNote that in spite of superficial similarity, this word is unrelated to Khmer ទី (tii), Thai ที่ (tîi), Japanese 第 (dai), all from Chinese 第 (MC dejH) (SV: đệ).", "head_templates": [ { "args": { "1": "vi", "2": "noun", "3": "", "4": "", "head": "", "tr": "" }, "expansion": "thứ", "name": "head" }, { "args": {}, "expansion": "thứ", "name": "vi-noun" } ], "lang": "Vietnamese", "lang_code": "vi", "pos": "noun", "senses": [ { "glosses": [ "order, rank, sort, type, kind, category" ], "links": [ [ "order", "order" ], [ "rank", "rank" ], [ "sort", "sort" ], [ "type", "type" ], [ "kind", "kind" ], [ "category", "category" ] ] }, { "glosses": [ "thing" ], "links": [ [ "thing", "thing" ] ] } ], "sounds": [ { "ipa": "[tʰɨ˧˦]", "tags": [ "Hà-Nội" ] }, { "ipa": "[tʰɨ˨˩˦]", "tags": [ "Huế" ] }, { "ipa": "[tʰɨ˦˥]", "tags": [ "Hồ-Chí-Minh-City" ] }, { "audio": "LL-Q9199 (vie)-Penn Zero MSSJ-thứ.wav", "mp3_url": "https://upload.wikimedia.org/wikipedia/commons/transcoded/3/3d/LL-Q9199_%28vie%29-Penn_Zero_MSSJ-th%E1%BB%A9.wav/LL-Q9199_%28vie%29-Penn_Zero_MSSJ-th%E1%BB%A9.wav.mp3", "ogg_url": "https://upload.wikimedia.org/wikipedia/commons/transcoded/3/3d/LL-Q9199_%28vie%29-Penn_Zero_MSSJ-th%E1%BB%A9.wav/LL-Q9199_%28vie%29-Penn_Zero_MSSJ-th%E1%BB%A9.wav.ogg", "tags": [ "Hà-Nội" ], "text": "Audio (Hà Nội)" } ], "word": "thứ" } { "categories": [ "Sino-Vietnamese words", "Vietnamese adjectives", "Vietnamese classifiers", "Vietnamese entries with incorrect language header", "Vietnamese lemmas", "Vietnamese nouns", "Vietnamese nouns without classifiers", "Vietnamese terms with IPA pronunciation", "Vietnamese terms with audio links", "Vietnamese verbs" ], "etymology_number": 1, "etymology_templates": [ { "args": { "1": "vi", "2": "Sino-Vietnamese words" }, "expansion": "", "name": "categorize" }, { "args": { "1": "次" }, "expansion": "Sino-Vietnamese word from 次", "name": "vi-etym-sino" }, { "args": { "1": "km", "2": "ទី" }, "expansion": "Khmer ទី (tii)", "name": "ncog" }, { "args": { "1": "th", "2": "ที่" }, "expansion": "Thai ที่ (tîi)", "name": "ncog" }, { "args": { "1": "ja", "2": "第", "tr": "dai" }, "expansion": "Japanese 第 (dai)", "name": "ncog" }, { "args": { "1": "zh", "2": "-" }, "expansion": "Chinese", "name": "ncog" }, { "args": { "1": "第" }, "expansion": "第 (MC dejH)", "name": "ltc-l" } ], "etymology_text": "Sino-Vietnamese word from 次.\nNote that in spite of superficial similarity, this word is unrelated to Khmer ទី (tii), Thai ที่ (tîi), Japanese 第 (dai), all from Chinese 第 (MC dejH) (SV: đệ).", "head_templates": [ { "args": { "1": "vi", "2": "classifier", "head": "", "tr": "" }, "expansion": "thứ", "name": "head" }, { "args": {}, "expansion": "thứ", "name": "vi-cls" } ], "lang": "Vietnamese", "lang_code": "vi", "pos": "classifier", "senses": [ { "glosses": [ "Indicates things of the same category, such as languages (tiếng)" ], "links": [ [ "same", "same#English" ], [ "category", "category#English" ], [ "language", "language#English" ], [ "tiếng", "tiếng#Vietnamese" ] ] } ], "sounds": [ { "ipa": "[tʰɨ˧˦]", "tags": [ "Hà-Nội" ] }, { "ipa": "[tʰɨ˨˩˦]", "tags": [ "Huế" ] }, { "ipa": "[tʰɨ˦˥]", "tags": [ "Hồ-Chí-Minh-City" ] }, { "audio": "LL-Q9199 (vie)-Penn Zero MSSJ-thứ.wav", "mp3_url": "https://upload.wikimedia.org/wikipedia/commons/transcoded/3/3d/LL-Q9199_%28vie%29-Penn_Zero_MSSJ-th%E1%BB%A9.wav/LL-Q9199_%28vie%29-Penn_Zero_MSSJ-th%E1%BB%A9.wav.mp3", "ogg_url": "https://upload.wikimedia.org/wikipedia/commons/transcoded/3/3d/LL-Q9199_%28vie%29-Penn_Zero_MSSJ-th%E1%BB%A9.wav/LL-Q9199_%28vie%29-Penn_Zero_MSSJ-th%E1%BB%A9.wav.ogg", "tags": [ "Hà-Nội" ], "text": "Audio (Hà Nội)" } ], "word": "thứ" } { "categories": [ "Sino-Vietnamese words", "Vietnamese entries with incorrect language header", "Vietnamese lemmas", "Vietnamese terms with IPA pronunciation", "Vietnamese terms with audio links", "Vietnamese verbs" ], "etymology_number": 2, "etymology_templates": [ { "args": { "1": "vi", "2": "Sino-Vietnamese words" }, "expansion": "", "name": "categorize" }, { "args": { "1": "恕" }, "expansion": "Sino-Vietnamese word from 恕", "name": "vi-etym-sino" } ], "etymology_text": "Sino-Vietnamese word from 恕.", "head_templates": [ { "args": { "1": "vi", "2": "verb", "3": "", "4": "", "head": "", "tr": "" }, "expansion": "thứ", "name": "head" }, { "args": {}, "expansion": "thứ", "name": "vi-verb" } ], "lang": "Vietnamese", "lang_code": "vi", "pos": "verb", "related": [ { "word": "tha thứ" } ], "senses": [ { "categories": [ "Vietnamese literary terms" ], "glosses": [ "to pardon, to forgive" ], "links": [ [ "pardon", "pardon" ], [ "forgive", "forgive" ] ], "raw_glosses": [ "(chiefly in compounds, literary) to pardon, to forgive" ], "tags": [ "in-compounds", "literary" ] } ], "sounds": [ { "ipa": "[tʰɨ˧˦]", "tags": [ "Hà-Nội" ] }, { "ipa": "[tʰɨ˨˩˦]", "tags": [ "Huế" ] }, { "ipa": "[tʰɨ˦˥]", "tags": [ "Hồ-Chí-Minh-City" ] }, { "audio": "LL-Q9199 (vie)-Penn Zero MSSJ-thứ.wav", "mp3_url": "https://upload.wikimedia.org/wikipedia/commons/transcoded/3/3d/LL-Q9199_%28vie%29-Penn_Zero_MSSJ-th%E1%BB%A9.wav/LL-Q9199_%28vie%29-Penn_Zero_MSSJ-th%E1%BB%A9.wav.mp3", "ogg_url": "https://upload.wikimedia.org/wikipedia/commons/transcoded/3/3d/LL-Q9199_%28vie%29-Penn_Zero_MSSJ-th%E1%BB%A9.wav/LL-Q9199_%28vie%29-Penn_Zero_MSSJ-th%E1%BB%A9.wav.ogg", "tags": [ "Hà-Nội" ], "text": "Audio (Hà Nội)" } ], "word": "thứ" }
This page is a part of the kaikki.org machine-readable Vietnamese dictionary. This dictionary is based on structured data extracted on 2024-05-24 from the enwiktionary dump dated 2024-05-02 using wiktextract (46b31b8 and c7ea76d). The data shown on this site has been post-processed and various details (e.g., extra categories) removed, some information disambiguated, and additional data merged from other sources. See the raw data download page for the unprocessed wiktextract data.
If you use this data in academic research, please cite Tatu Ylonen: Wiktextract: Wiktionary as Machine-Readable Structured Data, Proceedings of the 13th Conference on Language Resources and Evaluation (LREC), pp. 1317-1325, Marseille, 20-25 June 2022. Linking to the relevant page(s) under https://kaikki.org would also be greatly appreciated.