See 쪽 on Wiktionary
{ "etymology_number": 1, "etymology_templates": [ { "args": { "1": "gci", "2": "쪽", "3": "ccwok" }, "expansion": "First attested in the Gyechuk ilgi (癸丑日記 / 계축일기), c. 1600 , as Early Modern Korean 쪽 (Yale: ccwok).", "name": "ko-etym-native" } ], "etymology_text": "First attested in the Gyechuk ilgi (癸丑日記 / 계축일기), c. 1600 , as Early Modern Korean 쪽 (Yale: ccwok).", "forms": [ { "form": "jjok", "tags": [ "romanization" ] } ], "head_templates": [ { "args": { "1": "dependent" }, "expansion": "쪽 • (jjok)", "name": "ko-pos" } ], "lang": "Korean", "lang_code": "ko", "pos": "noun", "senses": [ { "glosses": [ "side" ], "id": "en-쪽-ko-noun-6nv0u3Iw", "links": [ [ "side", "side" ] ], "tags": [ "dependent" ] }, { "categories": [ { "_dis": "16 53 16 16", "kind": "other", "name": "Native Korean words", "parents": [], "source": "w+disamb" } ], "glosses": [ "direction of approach or movement" ], "id": "en-쪽-ko-noun-r20fwSfv", "links": [ [ "direction", "direction" ] ], "tags": [ "dependent" ] } ], "sounds": [ { "ipa": "[t͡ɕ͈o̞k̚]", "tags": [ "SK-Standard", "Seoul" ] }, { "hangeul": "쪽" }, { "other": "[쪽]" } ], "word": "쪽" } { "derived": [ { "_dis1": "0 0", "english": "Jap", "roman": "jjokbari", "word": "쪽발이" }, { "_dis1": "0 0", "english": "note, slip of paper", "roman": "jjokji", "word": "쪽지" } ], "etymology_number": 2, "etymology_templates": [ { "args": { "1": "pts", "2": "ᄧᅩᆨ", "3": "pcwok" }, "expansion": "First attested in the Bak Tongsa eonhae (朴通事諺解 / 박통사언해), 1677, as Early Modern Korean ᄧᅩᆨ (Yale: pcwok).", "name": "ko-etym-native" } ], "etymology_text": "First attested in the Bak Tongsa eonhae (朴通事諺解 / 박통사언해), 1677, as Early Modern Korean ᄧᅩᆨ (Yale: pcwok).", "forms": [ { "form": "jjok", "tags": [ "romanization" ] } ], "head_templates": [ { "args": {}, "expansion": "쪽 • (jjok)", "name": "ko-noun" } ], "lang": "Korean", "lang_code": "ko", "pos": "noun", "related": [ { "_dis1": "0 0", "roman": "bubun", "word": "부분" }, { "_dis1": "0 0", "roman": "ilbu", "word": "일부" }, { "_dis1": "0 0", "roman": "jogak", "word": "조각" } ], "senses": [ { "glosses": [ "a part, piece" ], "id": "en-쪽-ko-noun-Hw~aVsIX", "links": [ [ "part", "part" ], [ "piece", "piece" ] ] }, { "glosses": [ "page" ], "id": "en-쪽-ko-noun-NmAxWprz", "links": [ [ "page", "page" ] ] } ], "sounds": [ { "ipa": "[t͡ɕ͈o̞k̚]", "tags": [ "SK-Standard", "Seoul" ] }, { "hangeul": "쪽" }, { "other": "[쪽]" } ], "word": "쪽" } { "derived": [ { "_dis1": "0 0 0 0 0 0 0 0 0", "roman": "jjokjjok", "word": "쪽쪽" } ], "etymology_number": 3, "etymology_templates": [ { "args": { "1": "족" }, "expansion": "족 (jok)", "name": "ko-l" } ], "etymology_text": "Intensive form of 족 (jok).", "forms": [ { "form": "jjok", "tags": [ "romanization" ] } ], "head_templates": [ { "args": { "1": "ideophone" }, "expansion": "쪽 • (jjok)", "name": "ko-pos" } ], "lang": "Korean", "lang_code": "ko", "pos": "noun", "senses": [ { "categories": [ { "_dis": "0 6 0 0 23 7 8 6 1 17 3 1 12 2 0 13", "kind": "other", "name": "Korean entries with incorrect language header", "parents": [ "Entries with incorrect language header", "Entry maintenance" ], "source": "w+disamb" }, { "_dis": "1 10 1 1 17 10 8 6 2 14 4 2 9 3 1 11", "kind": "other", "name": "Korean terms with redundant script codes", "parents": [ "Terms with redundant script codes", "Entry maintenance" ], "source": "w+disamb" }, { "_dis": "0 7 0 0 20 8 8 6 1 16 3 1 11 2 0 14", "kind": "other", "name": "Korean terms with redundant transliterations", "parents": [ "Terms with redundant transliterations", "Entry maintenance" ], "source": "w+disamb" }, { "_dis": "0 3 0 7 23 4 8 6 1 17 3 1 11 2 0 12", "kind": "other", "name": "Pages with 1 entry", "parents": [], "source": "w+disamb" }, { "_dis": "0 2 0 7 25 6 7 6 1 18 1 1 12 1 0 13", "kind": "other", "name": "Pages with entries", "parents": [], "source": "w+disamb" }, { "_dis": "30 6 8 7 3 22 3 2 15 3", "kind": "other", "name": "Korean ideophones", "parents": [], "source": "w+disamb" }, { "_dis": "1 5 1 1 19 6 9 6 2 16 4 3 9 3 1 14", "kind": "lifeform", "langcode": "ko", "name": "Buckwheat family plants", "orig": "ko:Buckwheat family plants", "parents": [ "Caryophyllales order plants", "Plants", "Lifeforms", "All topics", "Life", "Fundamental", "Nature" ], "source": "w+disamb" } ], "glosses": [ "in a manner indeed arranged in a row; while indeed arranging in a row" ], "id": "en-쪽-ko-noun-GB-p6vjH", "links": [ [ "arrange", "arrange" ] ], "raw_glosses": [ "(of small objects) in a manner indeed arranged in a row; while indeed arranging in a row" ], "raw_tags": [ "of small objects", "ideophone" ] }, { "categories": [ { "_dis": "1 10 1 1 17 10 8 6 2 14 4 2 9 3 1 11", "kind": "other", "name": "Korean terms with redundant script codes", "parents": [ "Terms with redundant script codes", "Entry maintenance" ], "source": "w+disamb" } ], "glosses": [ "without any sort of break; in one single seating" ], "id": "en-쪽-ko-noun-sBvhVTzD", "links": [ [ "break", "break" ], [ "single", "single" ], [ "seating", "seating" ] ], "raw_glosses": [ "(of a recitation or story) without any sort of break; in one single seating" ], "raw_tags": [ "of a recitation or story", "ideophone" ] }, { "glosses": [ "tearing in one forceful continuous stroke" ], "id": "en-쪽-ko-noun-e92-gBkb", "links": [ [ "tear", "tear" ], [ "one", "one" ], [ "forceful", "forceful" ], [ "continuous", "continuous" ], [ "stroke", "stroke" ] ], "raw_glosses": [ "(of a small thing) tearing in one forceful continuous stroke" ], "raw_tags": [ "of a small thing", "ideophone" ] }, { "glosses": [ "sucking or gulping in one forceful continuous stroke" ], "id": "en-쪽-ko-noun-pP7WpTfj", "links": [ [ "suck", "suck" ], [ "gulp", "gulp" ], [ "one", "one" ], [ "forceful", "forceful" ], [ "continuous", "continuous" ], [ "stroke", "stroke" ] ], "raw_glosses": [ "(of a small amount of liquid) sucking or gulping in one forceful continuous stroke" ], "raw_tags": [ "of a small amount of liquid", "ideophone" ] }, { "glosses": [ "stretching in a broad manner" ], "id": "en-쪽-ko-noun-EdIWy6gK", "links": [ [ "stretch", "stretch" ], [ "broad", "broad" ] ], "raw_glosses": [ "(of a small thing) stretching in a broad manner" ], "raw_tags": [ "of a small thing", "ideophone" ] }, { "categories": [ { "_dis": "1 10 1 1 17 10 8 6 2 14 4 2 9 3 1 11", "kind": "other", "name": "Korean terms with redundant script codes", "parents": [ "Terms with redundant script codes", "Entry maintenance" ], "source": "w+disamb" }, { "_dis": "1 5 1 1 19 6 9 6 2 16 4 3 9 3 1 14", "kind": "lifeform", "langcode": "ko", "name": "Buckwheat family plants", "orig": "ko:Buckwheat family plants", "parents": [ "Caryophyllales order plants", "Plants", "Lifeforms", "All topics", "Life", "Fundamental", "Nature" ], "source": "w+disamb" } ], "glosses": [ "looking over in a forceful glance (over a relatively small area)" ], "id": "en-쪽-ko-noun-ryRqh94Y", "links": [ [ "looking over", "look over" ], [ "forceful", "forceful" ], [ "glance", "glance" ] ], "raw_tags": [ "ideophone" ] }, { "glosses": [ "while being split or cut in a single stroke" ], "id": "en-쪽-ko-noun-iQV10Utc", "links": [ [ "split", "split" ], [ "cut", "cut" ] ], "raw_glosses": [ "(of a small object) while being split or cut in a single stroke" ], "raw_tags": [ "of a small object", "ideophone" ] }, { "glosses": [ "while being drained (both literally and metaphorically)" ], "id": "en-쪽-ko-noun-6o0P565p", "links": [ [ "drained", "drained" ] ], "raw_tags": [ "ideophone" ] }, { "glosses": [ "fashionably; sexily" ], "id": "en-쪽-ko-noun-uiTLNTnp", "links": [ [ "fashionably", "fashionably" ], [ "sexily", "sexily" ] ], "raw_tags": [ "ideophone" ] } ], "sounds": [ { "ipa": "[t͡ɕ͈o̞k̚]", "tags": [ "SK-Standard", "Seoul" ] }, { "hangeul": "쪽" }, { "other": "[쪽]" } ], "word": "쪽" } { "etymology_number": 4, "etymology_text": "Onomatopoeic.", "forms": [ { "form": "jjok", "tags": [ "romanization" ] } ], "head_templates": [ { "args": { "1": "ideophone" }, "expansion": "쪽 • (jjok)", "name": "ko-pos" } ], "lang": "Korean", "lang_code": "ko", "pos": "noun", "senses": [ { "categories": [ { "kind": "other", "name": "Korean onomatopoeias", "parents": [], "source": "w" } ], "derived": [ { "english": "while repeatedly kissing", "roman": "jjokjjok", "word": "쪽쪽" } ], "glosses": [ "while kissing once" ], "id": "en-쪽-ko-noun-kgVkWtN0", "links": [ [ "onomatopoeia", "onomatopoeia" ], [ "kiss", "kiss" ] ], "raw_glosses": [ "(onomatopoeia) while kissing once" ], "raw_tags": [ "ideophone" ], "tags": [ "onomatopoeic" ] } ], "sounds": [ { "ipa": "[t͡ɕ͈o̞k̚]", "tags": [ "SK-Standard", "Seoul" ] }, { "hangeul": "쪽" }, { "other": "[쪽]" } ], "word": "쪽" } { "etymology_number": 5, "forms": [ { "form": "jjok", "tags": [ "romanization" ] } ], "head_templates": [ { "args": {}, "expansion": "쪽 • (jjok)", "name": "ko-noun" } ], "lang": "Korean", "lang_code": "ko", "pos": "noun", "senses": [ { "categories": [], "derived": [ { "english": "ashamed, shameful", "roman": "jjokpallida", "word": "쪽팔리다" } ], "glosses": [ "face" ], "id": "en-쪽-ko-noun-AoLZt59C", "links": [ [ "face", "face" ] ], "raw_glosses": [ "(vulgar) face" ], "tags": [ "vulgar" ] } ], "sounds": [ { "ipa": "[t͡ɕ͈o̞k̚]", "tags": [ "SK-Standard", "Seoul" ] }, { "hangeul": "쪽" }, { "other": "[쪽]" } ], "word": "쪽" } { "etymology_number": 6, "forms": [ { "form": "jjok", "tags": [ "romanization" ] } ], "head_templates": [ { "args": {}, "expansion": "쪽 • (jjok)", "name": "ko-noun" } ], "lang": "Korean", "lang_code": "ko", "pos": "noun", "senses": [ { "categories": [ { "_dis": "1 10 1 1 17 10 8 6 2 14 4 2 9 3 1 11", "kind": "other", "name": "Korean terms with redundant script codes", "parents": [ "Terms with redundant script codes", "Entry maintenance" ], "source": "w+disamb" }, { "_dis": "1 5 1 1 19 6 9 6 2 16 4 3 9 3 1 14", "kind": "lifeform", "langcode": "ko", "name": "Buckwheat family plants", "orig": "ko:Buckwheat family plants", "parents": [ "Caryophyllales order plants", "Plants", "Lifeforms", "All topics", "Life", "Fundamental", "Nature" ], "source": "w+disamb" } ], "glosses": [ "Japanese indigo (Persicaria tinctoria)" ], "id": "en-쪽-ko-noun-tcN8cbvY" } ], "sounds": [ { "ipa": "[t͡ɕ͈o̞k̚]", "tags": [ "SK-Standard", "Seoul" ] }, { "hangeul": "쪽" }, { "other": "[쪽]" } ], "word": "쪽" }
{ "categories": [ "Korean dependent nouns", "Korean entries with incorrect language header", "Korean lemmas", "Korean nouns", "Korean terms derived from Early Modern Korean", "Korean terms inherited from Early Modern Korean", "Korean terms with IPA pronunciation", "Korean terms with audio links", "Korean terms with redundant script codes", "Korean terms with redundant transliterations", "Native Korean words", "Pages with 1 entry", "Pages with entries", "ko:Buckwheat family plants" ], "etymology_number": 1, "etymology_templates": [ { "args": { "1": "gci", "2": "쪽", "3": "ccwok" }, "expansion": "First attested in the Gyechuk ilgi (癸丑日記 / 계축일기), c. 1600 , as Early Modern Korean 쪽 (Yale: ccwok).", "name": "ko-etym-native" } ], "etymology_text": "First attested in the Gyechuk ilgi (癸丑日記 / 계축일기), c. 1600 , as Early Modern Korean 쪽 (Yale: ccwok).", "forms": [ { "form": "jjok", "tags": [ "romanization" ] } ], "head_templates": [ { "args": { "1": "dependent" }, "expansion": "쪽 • (jjok)", "name": "ko-pos" } ], "lang": "Korean", "lang_code": "ko", "pos": "noun", "senses": [ { "glosses": [ "side" ], "links": [ [ "side", "side" ] ], "tags": [ "dependent" ] }, { "glosses": [ "direction of approach or movement" ], "links": [ [ "direction", "direction" ] ], "tags": [ "dependent" ] } ], "sounds": [ { "ipa": "[t͡ɕ͈o̞k̚]", "tags": [ "SK-Standard", "Seoul" ] }, { "hangeul": "쪽" }, { "other": "[쪽]" } ], "word": "쪽" } { "categories": [ "Korean entries with incorrect language header", "Korean lemmas", "Korean nouns", "Korean terms derived from Early Modern Korean", "Korean terms inherited from Early Modern Korean", "Korean terms with IPA pronunciation", "Korean terms with audio links", "Korean terms with redundant script codes", "Korean terms with redundant transliterations", "Native Korean words", "Pages with 1 entry", "Pages with entries", "ko:Buckwheat family plants" ], "derived": [ { "english": "Jap", "roman": "jjokbari", "word": "쪽발이" }, { "english": "note, slip of paper", "roman": "jjokji", "word": "쪽지" } ], "etymology_number": 2, "etymology_templates": [ { "args": { "1": "pts", "2": "ᄧᅩᆨ", "3": "pcwok" }, "expansion": "First attested in the Bak Tongsa eonhae (朴通事諺解 / 박통사언해), 1677, as Early Modern Korean ᄧᅩᆨ (Yale: pcwok).", "name": "ko-etym-native" } ], "etymology_text": "First attested in the Bak Tongsa eonhae (朴通事諺解 / 박통사언해), 1677, as Early Modern Korean ᄧᅩᆨ (Yale: pcwok).", "forms": [ { "form": "jjok", "tags": [ "romanization" ] } ], "head_templates": [ { "args": {}, "expansion": "쪽 • (jjok)", "name": "ko-noun" } ], "lang": "Korean", "lang_code": "ko", "pos": "noun", "related": [ { "roman": "bubun", "word": "부분" }, { "roman": "ilbu", "word": "일부" }, { "roman": "jogak", "word": "조각" } ], "senses": [ { "glosses": [ "a part, piece" ], "links": [ [ "part", "part" ], [ "piece", "piece" ] ] }, { "glosses": [ "page" ], "links": [ [ "page", "page" ] ] } ], "sounds": [ { "ipa": "[t͡ɕ͈o̞k̚]", "tags": [ "SK-Standard", "Seoul" ] }, { "hangeul": "쪽" }, { "other": "[쪽]" } ], "word": "쪽" } { "categories": [ "Korean entries with incorrect language header", "Korean ideophones", "Korean lemmas", "Korean nouns", "Korean terms with IPA pronunciation", "Korean terms with audio links", "Korean terms with redundant script codes", "Korean terms with redundant transliterations", "Korean yang-vowel forms", "Pages with 1 entry", "Pages with entries", "ko:Buckwheat family plants" ], "derived": [ { "roman": "jjokjjok", "word": "쪽쪽" } ], "etymology_number": 3, "etymology_templates": [ { "args": { "1": "족" }, "expansion": "족 (jok)", "name": "ko-l" } ], "etymology_text": "Intensive form of 족 (jok).", "forms": [ { "form": "jjok", "tags": [ "romanization" ] } ], "head_templates": [ { "args": { "1": "ideophone" }, "expansion": "쪽 • (jjok)", "name": "ko-pos" } ], "lang": "Korean", "lang_code": "ko", "pos": "noun", "senses": [ { "glosses": [ "in a manner indeed arranged in a row; while indeed arranging in a row" ], "links": [ [ "arrange", "arrange" ] ], "raw_glosses": [ "(of small objects) in a manner indeed arranged in a row; while indeed arranging in a row" ], "raw_tags": [ "of small objects", "ideophone" ] }, { "glosses": [ "without any sort of break; in one single seating" ], "links": [ [ "break", "break" ], [ "single", "single" ], [ "seating", "seating" ] ], "raw_glosses": [ "(of a recitation or story) without any sort of break; in one single seating" ], "raw_tags": [ "of a recitation or story", "ideophone" ] }, { "glosses": [ "tearing in one forceful continuous stroke" ], "links": [ [ "tear", "tear" ], [ "one", "one" ], [ "forceful", "forceful" ], [ "continuous", "continuous" ], [ "stroke", "stroke" ] ], "raw_glosses": [ "(of a small thing) tearing in one forceful continuous stroke" ], "raw_tags": [ "of a small thing", "ideophone" ] }, { "glosses": [ "sucking or gulping in one forceful continuous stroke" ], "links": [ [ "suck", "suck" ], [ "gulp", "gulp" ], [ "one", "one" ], [ "forceful", "forceful" ], [ "continuous", "continuous" ], [ "stroke", "stroke" ] ], "raw_glosses": [ "(of a small amount of liquid) sucking or gulping in one forceful continuous stroke" ], "raw_tags": [ "of a small amount of liquid", "ideophone" ] }, { "glosses": [ "stretching in a broad manner" ], "links": [ [ "stretch", "stretch" ], [ "broad", "broad" ] ], "raw_glosses": [ "(of a small thing) stretching in a broad manner" ], "raw_tags": [ "of a small thing", "ideophone" ] }, { "glosses": [ "looking over in a forceful glance (over a relatively small area)" ], "links": [ [ "looking over", "look over" ], [ "forceful", "forceful" ], [ "glance", "glance" ] ], "raw_tags": [ "ideophone" ] }, { "glosses": [ "while being split or cut in a single stroke" ], "links": [ [ "split", "split" ], [ "cut", "cut" ] ], "raw_glosses": [ "(of a small object) while being split or cut in a single stroke" ], "raw_tags": [ "of a small object", "ideophone" ] }, { "glosses": [ "while being drained (both literally and metaphorically)" ], "links": [ [ "drained", "drained" ] ], "raw_tags": [ "ideophone" ] }, { "glosses": [ "fashionably; sexily" ], "links": [ [ "fashionably", "fashionably" ], [ "sexily", "sexily" ] ], "raw_tags": [ "ideophone" ] } ], "sounds": [ { "ipa": "[t͡ɕ͈o̞k̚]", "tags": [ "SK-Standard", "Seoul" ] }, { "hangeul": "쪽" }, { "other": "[쪽]" } ], "word": "쪽" } { "categories": [ "Korean entries with incorrect language header", "Korean ideophones", "Korean lemmas", "Korean nouns", "Korean terms with IPA pronunciation", "Korean terms with audio links", "Korean terms with redundant script codes", "Korean terms with redundant transliterations", "Pages with 1 entry", "Pages with entries", "ko:Buckwheat family plants" ], "derived": [ { "english": "while repeatedly kissing", "roman": "jjokjjok", "word": "쪽쪽" } ], "etymology_number": 4, "etymology_text": "Onomatopoeic.", "forms": [ { "form": "jjok", "tags": [ "romanization" ] } ], "head_templates": [ { "args": { "1": "ideophone" }, "expansion": "쪽 • (jjok)", "name": "ko-pos" } ], "lang": "Korean", "lang_code": "ko", "pos": "noun", "senses": [ { "categories": [ "Korean onomatopoeias" ], "glosses": [ "while kissing once" ], "links": [ [ "onomatopoeia", "onomatopoeia" ], [ "kiss", "kiss" ] ], "raw_glosses": [ "(onomatopoeia) while kissing once" ], "raw_tags": [ "ideophone" ], "tags": [ "onomatopoeic" ] } ], "sounds": [ { "ipa": "[t͡ɕ͈o̞k̚]", "tags": [ "SK-Standard", "Seoul" ] }, { "hangeul": "쪽" }, { "other": "[쪽]" } ], "word": "쪽" } { "categories": [ "Korean entries with incorrect language header", "Korean lemmas", "Korean nouns", "Korean terms with IPA pronunciation", "Korean terms with audio links", "Korean terms with redundant script codes", "Korean terms with redundant transliterations", "Pages with 1 entry", "Pages with entries", "ko:Buckwheat family plants" ], "derived": [ { "english": "ashamed, shameful", "roman": "jjokpallida", "word": "쪽팔리다" } ], "etymology_number": 5, "forms": [ { "form": "jjok", "tags": [ "romanization" ] } ], "head_templates": [ { "args": {}, "expansion": "쪽 • (jjok)", "name": "ko-noun" } ], "lang": "Korean", "lang_code": "ko", "pos": "noun", "senses": [ { "categories": [ "Korean vulgarities" ], "glosses": [ "face" ], "links": [ [ "face", "face" ] ], "raw_glosses": [ "(vulgar) face" ], "tags": [ "vulgar" ] } ], "sounds": [ { "ipa": "[t͡ɕ͈o̞k̚]", "tags": [ "SK-Standard", "Seoul" ] }, { "hangeul": "쪽" }, { "other": "[쪽]" } ], "word": "쪽" } { "categories": [ "Korean entries with incorrect language header", "Korean lemmas", "Korean nouns", "Korean terms with IPA pronunciation", "Korean terms with audio links", "Korean terms with redundant script codes", "Korean terms with redundant transliterations", "Pages with 1 entry", "Pages with entries", "ko:Buckwheat family plants" ], "etymology_number": 6, "forms": [ { "form": "jjok", "tags": [ "romanization" ] } ], "head_templates": [ { "args": {}, "expansion": "쪽 • (jjok)", "name": "ko-noun" } ], "lang": "Korean", "lang_code": "ko", "pos": "noun", "senses": [ { "categories": [ "Entries missing English vernacular names of taxa", "Entries using missing taxonomic name (species)" ], "glosses": [ "Japanese indigo (Persicaria tinctoria)" ] } ], "sounds": [ { "ipa": "[t͡ɕ͈o̞k̚]", "tags": [ "SK-Standard", "Seoul" ] }, { "hangeul": "쪽" }, { "other": "[쪽]" } ], "word": "쪽" }
Download raw JSONL data for 쪽 meaning in All languages combined (8.9kB)
This page is a part of the kaikki.org machine-readable All languages combined dictionary. This dictionary is based on structured data extracted on 2024-11-06 from the enwiktionary dump dated 2024-10-02 using wiktextract (fbeafe8 and 7f03c9b). The data shown on this site has been post-processed and various details (e.g., extra categories) removed, some information disambiguated, and additional data merged from other sources. See the raw data download page for the unprocessed wiktextract data.
If you use this data in academic research, please cite Tatu Ylonen: Wiktextract: Wiktionary as Machine-Readable Structured Data, Proceedings of the 13th Conference on Language Resources and Evaluation (LREC), pp. 1317-1325, Marseille, 20-25 June 2022. Linking to the relevant page(s) under https://kaikki.org would also be greatly appreciated.