See ဆူ on Wiktionary
{ "derived": [ { "_dis1": "0 0 0 0 0", "roman": "krakhcu", "word": "ကြက်ဆူ" }, { "_dis1": "0 0 0 0 0", "roman": "krakhcuhci", "word": "ကြက်ဆူဆီ" }, { "_dis1": "0 0 0 0 0", "roman": "nga:hcupang", "word": "ငါးဆူပင်" }, { "_dis1": "0 0 0 0 0", "roman": "hcuhce:", "word": "ဆူဆေး" }, { "_dis1": "0 0 0 0 0", "roman": "hcu-nyam", "word": "ဆူညံ" }, { "_dis1": "0 0 0 0 0", "roman": "hcu-pwak", "word": "ဆူပွက်" }, { "_dis1": "0 0 0 0 0", "roman": "hcupu", "word": "ဆူပူ" }, { "_dis1": "0 0 0 0 0", "roman": "hculwainaplwai", "word": "ဆူလွယ်နပ်လွယ်" }, { "_dis1": "0 0 0 0 0", "roman": "htin.hcu", "word": "ထိန့်ဆူ" }, { "_dis1": "0 0 0 0 0", "roman": "pwakpwakhcu", "word": "ပွက်ပွက်ဆူ" }, { "_dis1": "0 0 0 0 0", "roman": "mankyany:krakhcu", "word": "မန်ကျည်းကြက်ဆူ" }, { "_dis1": "0 0 0 0 0", "roman": "rehcuhmat", "word": "ရေဆူမှတ်" }, { "_dis1": "0 0 0 0 0", "roman": "swe:hcu", "word": "သွေးဆူ" } ], "etymology_number": 1, "etymology_templates": [ { "args": { "1": "Inherited" }, "expansion": "Inherited", "name": "glossary" }, { "args": { "1": "my", "2": "obr", "3": "ဆော", "4": "", "5": "", "g": "", "g2": "", "g3": "", "id": "", "lit": "", "nocat": "", "pos": "", "sc": "", "sort": "", "tr": "", "ts": "" }, "expansion": "Old Burmese ဆော", "name": "inh" }, { "args": { "1": "my", "2": "obr", "3": "ဆော" }, "expansion": "Inherited from Old Burmese ဆော", "name": "inh+" }, { "args": { "1": "my", "2": "sit-pro", "3": "*tsjow", "t": "to boil, burn, cook, bake" }, "expansion": "Proto-Sino-Tibetan *tsjow (“to boil, burn, cook, bake”)", "name": "inh" }, { "args": { "1": "och", "2": "-" }, "expansion": "Old Chinese", "name": "cog" }, { "args": { "1": "焦", "2": "to scorch" }, "expansion": "焦 (OC *ʔsew, “to scorch”)", "name": "och-l" } ], "etymology_text": "Inherited from Old Burmese ဆော, ultimately from Proto-Sino-Tibetan *tsjow (“to boil, burn, cook, bake”). Cognate with Old Chinese 焦 (OC *ʔsew, “to scorch”); see there for more (STEDT).\nThe \"be noisy\" sense isn't given etymology by STEDT (shu²² \"make a row, racket\") and isn't mentioned by Luce 1981, while MED considers it a semantic extension of the \"boil\" sense, which appears semantically reasonable.", "forms": [ { "form": "hcu", "tags": [ "romanization" ] } ], "head_templates": [ { "args": {}, "expansion": "ဆူ • (hcu)", "name": "my-verb" } ], "lang": "Burmese", "lang_code": "my", "pos": "verb", "senses": [ { "categories": [], "glosses": [ "to boil, come to a boiling stage" ], "id": "en-ဆူ-my-verb-h-fd~ALT", "links": [ [ "water", "water" ], [ "liquid", "liquid" ], [ "boil", "boil" ], [ "come", "come" ], [ "boiling", "boiling" ], [ "stage", "stage" ] ], "qualifier": "liquid", "raw_glosses": [ "(intransitive, of water, liquid) to boil, come to a boiling stage" ], "raw_tags": [ "of water" ], "tags": [ "intransitive" ] }, { "glosses": [ "to effervesce, bubble, seethe" ], "id": "en-ဆူ-my-verb-4MMgHqBN", "links": [ [ "effervesce", "effervesce" ], [ "bubble", "bubble" ], [ "seethe", "seethe" ] ] }, { "glosses": [ "to be noisy, clamor" ], "id": "en-ဆူ-my-verb-397C0oLx", "links": [ [ "be", "be" ], [ "noisy", "noisy" ], [ "clamor", "clamor" ] ] }, { "glosses": [ "to scold, reprove" ], "id": "en-ဆူ-my-verb-fSMAgfmR", "links": [ [ "scold", "scold" ], [ "reprove", "reprove" ] ] }, { "glosses": [ "to be in a state of unrest" ], "id": "en-ဆူ-my-verb-CU6CSyct", "links": [ [ "state", "state" ], [ "unrest", "unrest" ] ] } ], "sounds": [ { "ipa": "/sʰù/" } ], "word": "ဆူ" } { "etymology_number": 2, "etymology_templates": [ { "args": { "1": "my", "2": "sit-pro", "3": "*tsow-s", "t": "fat, omentum" }, "expansion": "Proto-Sino-Tibetan *tsow-s (“fat, omentum”)", "name": "inh" }, { "args": { "1": "och", "2": "-" }, "expansion": "Old Chinese", "name": "cog" }, { "args": { "1": "臇", "2": "fatty; meaningful" }, "expansion": "臇 (OC *ʔsol, *ʔsonʔ, “fatty; meaningful”)", "name": "och-l" } ], "etymology_text": "From Proto-Sino-Tibetan *tsow-s (“fat, omentum”). Cognate with Old Chinese 臇 (OC *ʔsol, *ʔsonʔ, “fatty; meaningful”); see there for more (STEDT).", "forms": [ { "form": "hcu", "tags": [ "romanization" ] } ], "head_templates": [ { "args": {}, "expansion": "ဆူ • (hcu)", "name": "my-adj" } ], "lang": "Burmese", "lang_code": "my", "pos": "adj", "senses": [ { "glosses": [ "plump, fat (thick)" ], "id": "en-ဆူ-my-adj-6FRjtK~T", "links": [ [ "plump", "plump" ], [ "fat", "fat" ], [ "thick", "thick#English" ] ] } ], "sounds": [ { "ipa": "/sʰù/" } ], "word": "ဆူ" } { "etymology_number": 2, "etymology_templates": [ { "args": { "1": "my", "2": "sit-pro", "3": "*tsow-s", "t": "fat, omentum" }, "expansion": "Proto-Sino-Tibetan *tsow-s (“fat, omentum”)", "name": "inh" }, { "args": { "1": "och", "2": "-" }, "expansion": "Old Chinese", "name": "cog" }, { "args": { "1": "臇", "2": "fatty; meaningful" }, "expansion": "臇 (OC *ʔsol, *ʔsonʔ, “fatty; meaningful”)", "name": "och-l" } ], "etymology_text": "From Proto-Sino-Tibetan *tsow-s (“fat, omentum”). Cognate with Old Chinese 臇 (OC *ʔsol, *ʔsonʔ, “fatty; meaningful”); see there for more (STEDT).", "forms": [ { "form": "hcu", "tags": [ "romanization" ] } ], "head_templates": [ { "args": {}, "expansion": "ဆူ • (hcu)", "name": "my-verb" } ], "lang": "Burmese", "lang_code": "my", "pos": "verb", "senses": [ { "derived": [ { "roman": "hcu-krumnim.mrang.ma.rwe:", "word": "ဆူကြုံနိမ့်မြင့်မရွေး" }, { "roman": "hcuhprui:", "word": "ဆူဖြိုး" } ], "glosses": [ "to be plump, be well-filled out" ], "id": "en-ဆူ-my-verb-J8Ch2Sqe", "links": [ [ "be", "be" ], [ "well", "well" ], [ "filled out", "filled out" ] ] } ], "sounds": [ { "ipa": "/sʰù/" } ], "word": "ဆူ" } { "etymology_number": 3, "etymology_templates": [ { "args": { "1": "my", "2": "tbq-pro", "3": "*tsu", "t": "spirit of dead" }, "expansion": "Proto-Tibeto-Burman *tsu (“spirit of dead”)", "name": "inh" }, { "args": { "1": "kac", "t": "spirit", "tr": "tsù" }, "expansion": "Jingpho [script needed] (tsù, “spirit”)", "name": "cog" }, { "args": { "1": "och", "2": "-" }, "expansion": "Old Chinese", "name": "cog" }, { "args": { "1": "座", "2": "classifier for buildings" }, "expansion": "座 (OC *zoːls, “classifier for buildings”)", "name": "och-l" } ], "etymology_text": "From Proto-Tibeto-Burman *tsu (“spirit of dead”); cognate with Jingpho [script needed] (tsù, “spirit”) (STEDT). Note also similarities to Old Chinese 座 (OC *zoːls, “classifier for buildings”).", "forms": [ { "form": "hcu", "tags": [ "romanization" ] } ], "head_templates": [ { "args": { "1": "my", "2": "classifier" }, "expansion": "ဆူ • (hcu)", "name": "head" } ], "lang": "Burmese", "lang_code": "my", "pos": "classifier", "senses": [ { "categories": [ { "kind": "topical", "langcode": "my", "name": "Buddhism", "orig": "my:Buddhism", "parents": [ "Religion", "Culture", "Society", "All topics", "Fundamental" ], "source": "w" }, { "_dis": "2 57 5 2 7 18 0 9", "kind": "other", "name": "Burmese classifiers", "parents": [], "source": "w+disamb" }, { "_dis": "4 35 8 4 8 20 3 19", "kind": "other", "name": "Burmese entries with incorrect language header", "parents": [ "Entries with incorrect language header", "Entry maintenance" ], "source": "w+disamb" }, { "_dis": "6 45 8 6 6 7 4 18", "kind": "other", "name": "Pages with 2 entries", "parents": [], "source": "w+disamb" }, { "_dis": "5 41 7 5 5 7 4 27", "kind": "other", "name": "Pages with entries", "parents": [], "source": "w+disamb" } ], "derived": [ { "roman": "hcuhlai", "word": "ဆူလှယ်" }, { "roman": "hnackyiphrachcu-pwai:", "word": "နှစ်ကျိပ်ရှစ်ဆူပွဲ" }, { "roman": "bhu.ra:kui:hcu", "word": "ဘုရားကိုးဆူ" }, { "roman": "bhu.ra:tachcugutaclum:", "word": "ဘုရားတစ်ဆူဂူတစ်လုံး" } ], "examples": [ { "english": "two pagodas", "roman": "bhu.ra: hnachcu", "text": "ဘုရား နှစ်ဆူ", "type": "example" } ], "glosses": [ "numerical classifier for pagodas, images of the Buddha, and other sacred objects" ], "id": "en-ဆူ-my-classifier-qZ-alT1k", "links": [ [ "Buddhism", "Buddhism" ], [ "pagoda", "pagoda#English" ], [ "image", "image#English" ], [ "Buddha", "Buddha#English" ], [ "sacred", "sacred#English" ], [ "object", "object#English" ] ], "raw_glosses": [ "(Buddhism) numerical classifier for pagodas, images of the Buddha, and other sacred objects" ], "topics": [ "Buddhism", "lifestyle", "religion" ] } ], "sounds": [ { "ipa": "/sʰù/" } ], "word": "ဆူ" } { "forms": [ { "form": "hsoo", "tags": [ "romanization" ] } ], "head_templates": [ { "args": { "1": "ksw", "2": "preposition" }, "expansion": "ဆူ • (hsoo)", "name": "head" } ], "lang": "S'gaw Karen", "lang_code": "ksw", "pos": "prep", "senses": [ { "categories": [ { "kind": "other", "name": "Pages with 2 entries", "parents": [], "source": "w" }, { "kind": "other", "name": "Pages with entries", "parents": [], "source": "w" }, { "kind": "other", "name": "S'gaw Karen entries with incorrect language header", "parents": [ "Entries with incorrect language header", "Entry maintenance" ], "source": "w" }, { "kind": "other", "name": "S'gaw Karen prepositions", "parents": [], "source": "w" } ], "glosses": [ "Used to indicate destination: to" ], "id": "en-ဆူ-ksw-prep-mK~XWiwz", "links": [ [ "to", "to" ] ] } ], "word": "ဆူ" }
{ "categories": [ "Burmese classifiers", "Burmese entries with incorrect language header", "Burmese lemmas", "Burmese terms derived from Old Burmese", "Burmese terms derived from Proto-Sino-Tibetan", "Burmese terms derived from Proto-Tibeto-Burman", "Burmese terms inherited from Old Burmese", "Burmese terms inherited from Proto-Sino-Tibetan", "Burmese terms inherited from Proto-Tibeto-Burman", "Burmese terms with IPA pronunciation", "Burmese verbs", "Pages with 2 entries", "Pages with entries", "Requests for native script for Jingpho terms" ], "derived": [ { "roman": "krakhcu", "word": "ကြက်ဆူ" }, { "roman": "krakhcuhci", "word": "ကြက်ဆူဆီ" }, { "roman": "nga:hcupang", "word": "ငါးဆူပင်" }, { "roman": "hcuhce:", "word": "ဆူဆေး" }, { "roman": "hcu-nyam", "word": "ဆူညံ" }, { "roman": "hcu-pwak", "word": "ဆူပွက်" }, { "roman": "hcupu", "word": "ဆူပူ" }, { "roman": "hculwainaplwai", "word": "ဆူလွယ်နပ်လွယ်" }, { "roman": "htin.hcu", "word": "ထိန့်ဆူ" }, { "roman": "pwakpwakhcu", "word": "ပွက်ပွက်ဆူ" }, { "roman": "mankyany:krakhcu", "word": "မန်ကျည်းကြက်ဆူ" }, { "roman": "rehcuhmat", "word": "ရေဆူမှတ်" }, { "roman": "swe:hcu", "word": "သွေးဆူ" } ], "etymology_number": 1, "etymology_templates": [ { "args": { "1": "Inherited" }, "expansion": "Inherited", "name": "glossary" }, { "args": { "1": "my", "2": "obr", "3": "ဆော", "4": "", "5": "", "g": "", "g2": "", "g3": "", "id": "", "lit": "", "nocat": "", "pos": "", "sc": "", "sort": "", "tr": "", "ts": "" }, "expansion": "Old Burmese ဆော", "name": "inh" }, { "args": { "1": "my", "2": "obr", "3": "ဆော" }, "expansion": "Inherited from Old Burmese ဆော", "name": "inh+" }, { "args": { "1": "my", "2": "sit-pro", "3": "*tsjow", "t": "to boil, burn, cook, bake" }, "expansion": "Proto-Sino-Tibetan *tsjow (“to boil, burn, cook, bake”)", "name": "inh" }, { "args": { "1": "och", "2": "-" }, "expansion": "Old Chinese", "name": "cog" }, { "args": { "1": "焦", "2": "to scorch" }, "expansion": "焦 (OC *ʔsew, “to scorch”)", "name": "och-l" } ], "etymology_text": "Inherited from Old Burmese ဆော, ultimately from Proto-Sino-Tibetan *tsjow (“to boil, burn, cook, bake”). Cognate with Old Chinese 焦 (OC *ʔsew, “to scorch”); see there for more (STEDT).\nThe \"be noisy\" sense isn't given etymology by STEDT (shu²² \"make a row, racket\") and isn't mentioned by Luce 1981, while MED considers it a semantic extension of the \"boil\" sense, which appears semantically reasonable.", "forms": [ { "form": "hcu", "tags": [ "romanization" ] } ], "head_templates": [ { "args": {}, "expansion": "ဆူ • (hcu)", "name": "my-verb" } ], "lang": "Burmese", "lang_code": "my", "pos": "verb", "senses": [ { "categories": [ "Burmese intransitive verbs" ], "glosses": [ "to boil, come to a boiling stage" ], "links": [ [ "water", "water" ], [ "liquid", "liquid" ], [ "boil", "boil" ], [ "come", "come" ], [ "boiling", "boiling" ], [ "stage", "stage" ] ], "qualifier": "liquid", "raw_glosses": [ "(intransitive, of water, liquid) to boil, come to a boiling stage" ], "raw_tags": [ "of water" ], "tags": [ "intransitive" ] }, { "glosses": [ "to effervesce, bubble, seethe" ], "links": [ [ "effervesce", "effervesce" ], [ "bubble", "bubble" ], [ "seethe", "seethe" ] ] }, { "glosses": [ "to be noisy, clamor" ], "links": [ [ "be", "be" ], [ "noisy", "noisy" ], [ "clamor", "clamor" ] ] }, { "glosses": [ "to scold, reprove" ], "links": [ [ "scold", "scold" ], [ "reprove", "reprove" ] ] }, { "glosses": [ "to be in a state of unrest" ], "links": [ [ "state", "state" ], [ "unrest", "unrest" ] ] } ], "sounds": [ { "ipa": "/sʰù/" } ], "word": "ဆူ" } { "categories": [ "Burmese adjectives", "Burmese classifiers", "Burmese entries with incorrect language header", "Burmese lemmas", "Burmese terms derived from Proto-Sino-Tibetan", "Burmese terms derived from Proto-Tibeto-Burman", "Burmese terms inherited from Proto-Sino-Tibetan", "Burmese terms inherited from Proto-Tibeto-Burman", "Burmese terms with IPA pronunciation", "Burmese verbs", "Pages with 2 entries", "Pages with entries", "Requests for native script for Jingpho terms" ], "etymology_number": 2, "etymology_templates": [ { "args": { "1": "my", "2": "sit-pro", "3": "*tsow-s", "t": "fat, omentum" }, "expansion": "Proto-Sino-Tibetan *tsow-s (“fat, omentum”)", "name": "inh" }, { "args": { "1": "och", "2": "-" }, "expansion": "Old Chinese", "name": "cog" }, { "args": { "1": "臇", "2": "fatty; meaningful" }, "expansion": "臇 (OC *ʔsol, *ʔsonʔ, “fatty; meaningful”)", "name": "och-l" } ], "etymology_text": "From Proto-Sino-Tibetan *tsow-s (“fat, omentum”). Cognate with Old Chinese 臇 (OC *ʔsol, *ʔsonʔ, “fatty; meaningful”); see there for more (STEDT).", "forms": [ { "form": "hcu", "tags": [ "romanization" ] } ], "head_templates": [ { "args": {}, "expansion": "ဆူ • (hcu)", "name": "my-adj" } ], "lang": "Burmese", "lang_code": "my", "pos": "adj", "senses": [ { "glosses": [ "plump, fat (thick)" ], "links": [ [ "plump", "plump" ], [ "fat", "fat" ], [ "thick", "thick#English" ] ] } ], "sounds": [ { "ipa": "/sʰù/" } ], "word": "ဆူ" } { "categories": [ "Burmese adjectives", "Burmese classifiers", "Burmese entries with incorrect language header", "Burmese lemmas", "Burmese terms derived from Proto-Sino-Tibetan", "Burmese terms derived from Proto-Tibeto-Burman", "Burmese terms inherited from Proto-Sino-Tibetan", "Burmese terms inherited from Proto-Tibeto-Burman", "Burmese terms with IPA pronunciation", "Burmese verbs", "Pages with 2 entries", "Pages with entries", "Requests for native script for Jingpho terms" ], "derived": [ { "roman": "hcu-krumnim.mrang.ma.rwe:", "word": "ဆူကြုံနိမ့်မြင့်မရွေး" }, { "roman": "hcuhprui:", "word": "ဆူဖြိုး" } ], "etymology_number": 2, "etymology_templates": [ { "args": { "1": "my", "2": "sit-pro", "3": "*tsow-s", "t": "fat, omentum" }, "expansion": "Proto-Sino-Tibetan *tsow-s (“fat, omentum”)", "name": "inh" }, { "args": { "1": "och", "2": "-" }, "expansion": "Old Chinese", "name": "cog" }, { "args": { "1": "臇", "2": "fatty; meaningful" }, "expansion": "臇 (OC *ʔsol, *ʔsonʔ, “fatty; meaningful”)", "name": "och-l" } ], "etymology_text": "From Proto-Sino-Tibetan *tsow-s (“fat, omentum”). Cognate with Old Chinese 臇 (OC *ʔsol, *ʔsonʔ, “fatty; meaningful”); see there for more (STEDT).", "forms": [ { "form": "hcu", "tags": [ "romanization" ] } ], "head_templates": [ { "args": {}, "expansion": "ဆူ • (hcu)", "name": "my-verb" } ], "lang": "Burmese", "lang_code": "my", "pos": "verb", "senses": [ { "glosses": [ "to be plump, be well-filled out" ], "links": [ [ "be", "be" ], [ "well", "well" ], [ "filled out", "filled out" ] ] } ], "sounds": [ { "ipa": "/sʰù/" } ], "word": "ဆူ" } { "categories": [ "Burmese classifiers", "Burmese entries with incorrect language header", "Burmese lemmas", "Burmese terms derived from Proto-Tibeto-Burman", "Burmese terms inherited from Proto-Tibeto-Burman", "Burmese terms with IPA pronunciation", "Pages with 2 entries", "Pages with entries", "Requests for native script for Jingpho terms" ], "derived": [ { "roman": "hcuhlai", "word": "ဆူလှယ်" }, { "roman": "hnackyiphrachcu-pwai:", "word": "နှစ်ကျိပ်ရှစ်ဆူပွဲ" }, { "roman": "bhu.ra:kui:hcu", "word": "ဘုရားကိုးဆူ" }, { "roman": "bhu.ra:tachcugutaclum:", "word": "ဘုရားတစ်ဆူဂူတစ်လုံး" } ], "etymology_number": 3, "etymology_templates": [ { "args": { "1": "my", "2": "tbq-pro", "3": "*tsu", "t": "spirit of dead" }, "expansion": "Proto-Tibeto-Burman *tsu (“spirit of dead”)", "name": "inh" }, { "args": { "1": "kac", "t": "spirit", "tr": "tsù" }, "expansion": "Jingpho [script needed] (tsù, “spirit”)", "name": "cog" }, { "args": { "1": "och", "2": "-" }, "expansion": "Old Chinese", "name": "cog" }, { "args": { "1": "座", "2": "classifier for buildings" }, "expansion": "座 (OC *zoːls, “classifier for buildings”)", "name": "och-l" } ], "etymology_text": "From Proto-Tibeto-Burman *tsu (“spirit of dead”); cognate with Jingpho [script needed] (tsù, “spirit”) (STEDT). Note also similarities to Old Chinese 座 (OC *zoːls, “classifier for buildings”).", "forms": [ { "form": "hcu", "tags": [ "romanization" ] } ], "head_templates": [ { "args": { "1": "my", "2": "classifier" }, "expansion": "ဆူ • (hcu)", "name": "head" } ], "lang": "Burmese", "lang_code": "my", "pos": "classifier", "senses": [ { "categories": [ "Burmese terms with usage examples", "my:Buddhism" ], "examples": [ { "english": "two pagodas", "roman": "bhu.ra: hnachcu", "text": "ဘုရား နှစ်ဆူ", "type": "example" } ], "glosses": [ "numerical classifier for pagodas, images of the Buddha, and other sacred objects" ], "links": [ [ "Buddhism", "Buddhism" ], [ "pagoda", "pagoda#English" ], [ "image", "image#English" ], [ "Buddha", "Buddha#English" ], [ "sacred", "sacred#English" ], [ "object", "object#English" ] ], "raw_glosses": [ "(Buddhism) numerical classifier for pagodas, images of the Buddha, and other sacred objects" ], "topics": [ "Buddhism", "lifestyle", "religion" ] } ], "sounds": [ { "ipa": "/sʰù/" } ], "word": "ဆူ" } { "forms": [ { "form": "hsoo", "tags": [ "romanization" ] } ], "head_templates": [ { "args": { "1": "ksw", "2": "preposition" }, "expansion": "ဆူ • (hsoo)", "name": "head" } ], "lang": "S'gaw Karen", "lang_code": "ksw", "pos": "prep", "senses": [ { "categories": [ "Pages with 2 entries", "Pages with entries", "S'gaw Karen entries with incorrect language header", "S'gaw Karen lemmas", "S'gaw Karen prepositions" ], "glosses": [ "Used to indicate destination: to" ], "links": [ [ "to", "to" ] ] } ], "word": "ဆူ" }
Download raw JSONL data for ဆူ meaning in All languages combined (9.5kB)
This page is a part of the kaikki.org machine-readable All languages combined dictionary. This dictionary is based on structured data extracted on 2024-12-15 from the enwiktionary dump dated 2024-12-04 using wiktextract (8a39820 and 4401a4c). The data shown on this site has been post-processed and various details (e.g., extra categories) removed, some information disambiguated, and additional data merged from other sources. See the raw data download page for the unprocessed wiktextract data.
If you use this data in academic research, please cite Tatu Ylonen: Wiktextract: Wiktionary as Machine-Readable Structured Data, Proceedings of the 13th Conference on Language Resources and Evaluation (LREC), pp. 1317-1325, Marseille, 20-25 June 2022. Linking to the relevant page(s) under https://kaikki.org would also be greatly appreciated.