See உலகம் in All languages combined, or Wiktionary
{ "derived": [ { "_dis1": "0 0", "roman": "ulakakarttā", "word": "உலககர்த்தா" }, { "_dis1": "0 0", "roman": "ulakacañcāram", "word": "உலகசஞ்சாரம்" }, { "_dis1": "0 0", "roman": "ulakacayaṉ", "word": "உலகசயன்" }, { "_dis1": "0 0", "roman": "ulakañāṉam", "word": "உலகஞானம்" }, { "_dis1": "0 0", "roman": "ulakattār", "word": "உலகத்தார்" }, { "_dis1": "0 0", "roman": "ulakanātaṉ", "word": "உலகநாதன்" }, { "_dis1": "0 0", "roman": "ulakanīti", "word": "உலகநீதி" }, { "_dis1": "0 0", "roman": "ulakapattati", "word": "உலகபத்ததி" }, { "_dis1": "0 0", "roman": "ulakapālar", "word": "உலகபாலர்" }, { "_dis1": "0 0", "roman": "ulakappaṟṟu", "word": "உலகப்பற்று" }, { "_dis1": "0 0", "roman": "ulakappiracitti", "word": "உலகப்பிரசித்தி" }, { "_dis1": "0 0", "roman": "ulakappuraṭṭaṉ", "word": "உலகப்புரட்டன்" }, { "_dis1": "0 0", "roman": "ulakamaṉṉavaṉ", "word": "உலகமன்னவன்" }, { "_dis1": "0 0", "roman": "ulakamariyātai", "word": "உலகமரியாதை" }, { "_dis1": "0 0", "roman": "ulakamalaiyāmai", "word": "உலகமலையாமை" }, { "_dis1": "0 0", "roman": "ulakamalaivu", "word": "உலகமலைவு" }, { "_dis1": "0 0", "roman": "ulakamaḷantāṉ", "word": "உலகமளந்தான்" }, { "_dis1": "0 0", "roman": "ulakamātā", "word": "உலகமாதா" }, { "_dis1": "0 0", "roman": "ulakamuṇṭōṉ", "word": "உலகமுண்டோன்" }, { "_dis1": "0 0", "roman": "ulakayāttirai", "word": "உலகயாத்திரை" }, { "_dis1": "0 0", "roman": "ulakarīti", "word": "உலகரீதி" }, { "_dis1": "0 0", "roman": "ulakar", "word": "உலகர்" }, { "_dis1": "0 0", "roman": "ulakaḷavu", "word": "உலகளவு" }, { "_dis1": "0 0", "roman": "ulakavaṟavi", "word": "உலகவறவி" }, { "_dis1": "0 0", "roman": "ulakavaṟivu", "word": "உலகவறிவு" }, { "_dis1": "0 0", "roman": "ulakavaḻakkam", "word": "உலகவழக்கம்" }, { "_dis1": "0 0", "roman": "ulakavaḻakku", "word": "உலகவழக்கு" }, { "_dis1": "0 0", "roman": "ulakavāñcai", "word": "உலகவாஞ்சை" }, { "_dis1": "0 0", "roman": "ulakavātam", "word": "உலகவாதம்" }, { "_dis1": "0 0", "roman": "ulakavārttai", "word": "உலகவார்த்தை" }, { "_dis1": "0 0", "roman": "ulakavāḻvu", "word": "உலகவாழ்வு" }, { "_dis1": "0 0", "roman": "ulakaviṭaikaḻi", "word": "உலகவிடைகழி" }, { "_dis1": "0 0", "roman": "ulakaviyāpāram", "word": "உலகவியாபாரம்" }, { "_dis1": "0 0", "roman": "ulakaviruttam", "word": "உலகவிருத்தம்" }, { "_dis1": "0 0", "roman": "ulakavēṭaṇai", "word": "உலகவேடணை" }, { "_dis1": "0 0", "roman": "ulakikam", "word": "உலகிகம்" }, { "_dis1": "0 0", "roman": "ulakitaṉ", "word": "உலகிதன்" }, { "_dis1": "0 0", "roman": "ulakiyaṟcol", "word": "உலகியற்சொல்" }, { "_dis1": "0 0", "roman": "ulakiyal", "word": "உலகியல்" }, { "_dis1": "0 0", "roman": "ulakiyalvaḻakku", "word": "உலகியல்வழக்கு" }, { "_dis1": "0 0", "roman": "ulakuṭaiya perumāḷ", "word": "உலகுடைய பெருமாள்" }, { "_dis1": "0 0", "roman": "ulakēṭaṇai", "word": "உலகேடணை" }, { "_dis1": "0 0", "roman": "ēḻulakam", "word": "ஏழுலகம்" }, { "_dis1": "0 0", "roman": "kīḻulaku", "word": "கீழுலகு" }, { "_dis1": "0 0", "roman": "cellulaku", "word": "செல்லுலகு" }, { "_dis1": "0 0", "roman": "nilavulakam", "word": "நிலவுலகம்" }, { "_dis1": "0 0", "roman": "pūvulaku", "word": "பூவுலகு" }, { "_dis1": "0 0", "roman": "maṇṇulaku", "word": "மண்ணுலகு" }, { "_dis1": "0 0", "roman": "mēlulakam", "word": "மேலுலகம்" }, { "_dis1": "0 0", "roman": "mēlaiyulaku", "word": "மேலையுலகு" } ], "etymology_templates": [ { "args": { "1": "ta", "2": "sa", "3": "लोक" }, "expansion": "Borrowed from Sanskrit लोक (loka)", "name": "bor+" }, { "args": { "1": "ta", "2": "லோகம்" }, "expansion": "Doublet of லோகம் (lōkam)", "name": "dbt" } ], "etymology_text": "Borrowed from Sanskrit लोक (loka). Doublet of லோகம் (lōkam).", "forms": [ { "form": "ulakam", "tags": [ "romanization" ] }, { "form": "no-table-tags", "source": "declension", "tags": [ "table-tags" ] }, { "form": "ta-decl", "source": "declension", "tags": [ "inflection-template" ] }, { "form": "m-stem", "source": "declension", "tags": [ "class" ] }, { "form": "உலகம்", "roman": "ulakam", "source": "declension", "tags": [ "nominative", "singular" ] }, { "form": "உலகங்கள்", "roman": "ulakaṅkaḷ", "source": "declension", "tags": [ "nominative", "plural" ] }, { "form": "உலகமே", "roman": "ulakamē", "source": "declension", "tags": [ "singular", "vocative" ] }, { "form": "உலகங்களே", "roman": "ulakaṅkaḷē", "source": "declension", "tags": [ "plural", "vocative" ] }, { "form": "உலகத்தை", "roman": "ulakattai", "source": "declension", "tags": [ "accusative", "singular" ] }, { "form": "உலகங்களை", "roman": "ulakaṅkaḷai", "source": "declension", "tags": [ "accusative", "plural" ] }, { "form": "உலகத்துக்கு", "roman": "ulakattukku", "source": "declension", "tags": [ "dative", "singular" ] }, { "form": "உலகங்களுக்கு", "roman": "ulakaṅkaḷukku", "source": "declension", "tags": [ "dative", "plural" ] }, { "form": "உலகத்துக்காக", "roman": "ulakattukkāka", "source": "declension", "tags": [ "benefactive", "singular" ] }, { "form": "உலகங்களுக்காக", "roman": "ulakaṅkaḷukkāka", "source": "declension", "tags": [ "benefactive", "plural" ] }, { "form": "உலகத்துடைய", "roman": "ulakattuṭaiya", "source": "declension", "tags": [ "genitive", "genitive-i", "singular" ] }, { "form": "உலகங்களுடைய", "roman": "ulakaṅkaḷuṭaiya", "source": "declension", "tags": [ "genitive", "genitive-i", "plural" ] }, { "form": "உலகத்தின்", "roman": "ulakattiṉ", "source": "declension", "tags": [ "genitive", "genitive-ii", "singular" ] }, { "form": "உலகங்களின்", "roman": "ulakaṅkaḷiṉ", "source": "declension", "tags": [ "genitive", "genitive-ii", "plural" ] }, { "form": "உலகத்தில்", "roman": "ulakattil", "source": "declension", "tags": [ "locative", "locative-i", "singular" ] }, { "form": "உலகங்களில்", "roman": "ulakaṅkaḷil", "source": "declension", "tags": [ "locative", "locative-i", "plural" ] }, { "form": "உலகத்திடம்", "roman": "ulakattiṭam", "source": "declension", "tags": [ "locative", "locative-ii", "singular" ] }, { "form": "உலகங்களிடம்", "roman": "ulakaṅkaḷiṭam", "source": "declension", "tags": [ "locative", "locative-ii", "plural" ] }, { "form": "உலகத்தோடு", "roman": "ulakattōṭu", "source": "declension", "tags": [ "singular", "sociative", "sociative-i" ] }, { "form": "உலகங்களோடு", "roman": "ulakaṅkaḷōṭu", "source": "declension", "tags": [ "plural", "sociative", "sociative-i" ] }, { "form": "உலகத்துடன்", "roman": "ulakattuṭaṉ", "source": "declension", "tags": [ "singular", "sociative", "sociative-ii" ] }, { "form": "உலகங்களுடன்", "roman": "ulakaṅkaḷuṭaṉ", "source": "declension", "tags": [ "plural", "sociative", "sociative-ii" ] }, { "form": "உலகத்தால்", "roman": "ulakattāl", "source": "declension", "tags": [ "instrumental", "singular" ] }, { "form": "உலகங்களால்", "roman": "ulakaṅkaḷāl", "source": "declension", "tags": [ "instrumental", "plural" ] }, { "form": "உலகத்திலிருந்து", "roman": "ulakattiliruntu", "source": "declension", "tags": [ "ablative", "singular" ] }, { "form": "உலகங்களிலிருந்து", "roman": "ulakaṅkaḷiliruntu", "source": "declension", "tags": [ "ablative", "plural" ] } ], "head_templates": [ { "args": { "tr": "ulakam" }, "expansion": "உலகம் • (ulakam)", "name": "ta-noun" } ], "inflection_templates": [ { "args": {}, "name": "ta-decl" } ], "lang": "Tamil", "lang_code": "ta", "pos": "noun", "senses": [ { "categories": [ { "_dis": "50 50", "kind": "other", "name": "Pages with 1 entry", "parents": [], "source": "w+disamb" }, { "_dis": "46 54", "kind": "other", "name": "Pages with entries", "parents": [], "source": "w+disamb" }, { "_dis": "45 55", "kind": "other", "name": "Tamil entries with incorrect language header", "parents": [ "Entries with incorrect language header", "Entry maintenance" ], "source": "w+disamb" }, { "_dis": "45 55", "kind": "other", "name": "Tamil terms with redundant script codes", "parents": [ "Terms with redundant script codes", "Entry maintenance" ], "source": "w+disamb" } ], "glosses": [ "world, earth" ], "id": "en-உலகம்-ta-noun-Rqzf0fOn", "links": [ [ "world", "world" ], [ "earth", "earth" ] ], "synonyms": [ { "word": "உலகம்" } ] }, { "categories": [ { "_dis": "50 50", "kind": "other", "name": "Pages with 1 entry", "parents": [], "source": "w+disamb" }, { "_dis": "46 54", "kind": "other", "name": "Pages with entries", "parents": [], "source": "w+disamb" }, { "_dis": "45 55", "kind": "other", "name": "Tamil entries with incorrect language header", "parents": [ "Entries with incorrect language header", "Entry maintenance" ], "source": "w+disamb" }, { "_dis": "45 55", "kind": "other", "name": "Tamil terms with redundant script codes", "parents": [ "Terms with redundant script codes", "Entry maintenance" ], "source": "w+disamb" }, { "_dis": "33 67", "kind": "topical", "langcode": "ta", "name": "Planets", "orig": "ta:Planets", "parents": [ "Celestial bodies", "Space", "Nature", "All topics", "Fundamental" ], "source": "w+disamb" } ], "glosses": [ "planet" ], "id": "en-உலகம்-ta-noun-y1gV~lw8", "links": [ [ "planet", "planet" ] ], "synonyms": [ { "word": "கோள்" }, { "word": "கிரகம்" } ] } ], "sounds": [ { "ipa": "/ʊlɐɡɐm/" } ], "synonyms": [ { "_dis1": "0 0", "source": "Thesaurus:உலகம்", "word": "பார்" }, { "_dis1": "0 0", "source": "Thesaurus:உலகம்", "word": "ஞாலம்" }, { "_dis1": "0 0", "source": "Thesaurus:உலகம்", "word": "ஜகம்" }, { "_dis1": "0 0", "source": "Thesaurus:உலகம்", "word": "வையகம்" }, { "_dis1": "0 0", "source": "Thesaurus:உலகம்", "word": "பூமி" }, { "_dis1": "0 0", "source": "Thesaurus:உலகம்", "word": "உலகம்" }, { "_dis1": "0 0", "source": "Thesaurus:உலகம்", "word": "அண்டம்" }, { "_dis1": "0 0", "source": "Thesaurus:உலகம்", "word": "லோகம்" }, { "_dis1": "0 0", "source": "Thesaurus:உலகம்", "word": "அகிலம்" }, { "_dis1": "0 0", "source": "Thesaurus:உலகம்", "word": "அவனி" }, { "_dis1": "0 0", "source": "Thesaurus:உலகம்", "word": "தரணி" }, { "_dis1": "0 0", "source": "Thesaurus:உலகம்", "word": "காசினி" }, { "_dis1": "0 0", "source": "Thesaurus:உலகம்", "word": "மேதினி" }, { "_dis1": "0 0", "source": "Thesaurus:உலகம்", "word": "புவி" }, { "_dis1": "0 0", "source": "Thesaurus:உலகம்", "word": "ஊழி" } ], "word": "உலகம்" }
{ "categories": [ "Pages with 1 entry", "Pages with entries", "Tamil doublets", "Tamil entries with incorrect language header", "Tamil lemmas", "Tamil m-stem nouns", "Tamil nouns", "Tamil terms borrowed from Sanskrit", "Tamil terms derived from Sanskrit", "Tamil terms with IPA pronunciation", "Tamil terms with redundant script codes", "ta:Planets" ], "derived": [ { "roman": "ulakakarttā", "word": "உலககர்த்தா" }, { "roman": "ulakacañcāram", "word": "உலகசஞ்சாரம்" }, { "roman": "ulakacayaṉ", "word": "உலகசயன்" }, { "roman": "ulakañāṉam", "word": "உலகஞானம்" }, { "roman": "ulakattār", "word": "உலகத்தார்" }, { "roman": "ulakanātaṉ", "word": "உலகநாதன்" }, { "roman": "ulakanīti", "word": "உலகநீதி" }, { "roman": "ulakapattati", "word": "உலகபத்ததி" }, { "roman": "ulakapālar", "word": "உலகபாலர்" }, { "roman": "ulakappaṟṟu", "word": "உலகப்பற்று" }, { "roman": "ulakappiracitti", "word": "உலகப்பிரசித்தி" }, { "roman": "ulakappuraṭṭaṉ", "word": "உலகப்புரட்டன்" }, { "roman": "ulakamaṉṉavaṉ", "word": "உலகமன்னவன்" }, { "roman": "ulakamariyātai", "word": "உலகமரியாதை" }, { "roman": "ulakamalaiyāmai", "word": "உலகமலையாமை" }, { "roman": "ulakamalaivu", "word": "உலகமலைவு" }, { "roman": "ulakamaḷantāṉ", "word": "உலகமளந்தான்" }, { "roman": "ulakamātā", "word": "உலகமாதா" }, { "roman": "ulakamuṇṭōṉ", "word": "உலகமுண்டோன்" }, { "roman": "ulakayāttirai", "word": "உலகயாத்திரை" }, { "roman": "ulakarīti", "word": "உலகரீதி" }, { "roman": "ulakar", "word": "உலகர்" }, { "roman": "ulakaḷavu", "word": "உலகளவு" }, { "roman": "ulakavaṟavi", "word": "உலகவறவி" }, { "roman": "ulakavaṟivu", "word": "உலகவறிவு" }, { "roman": "ulakavaḻakkam", "word": "உலகவழக்கம்" }, { "roman": "ulakavaḻakku", "word": "உலகவழக்கு" }, { "roman": "ulakavāñcai", "word": "உலகவாஞ்சை" }, { "roman": "ulakavātam", "word": "உலகவாதம்" }, { "roman": "ulakavārttai", "word": "உலகவார்த்தை" }, { "roman": "ulakavāḻvu", "word": "உலகவாழ்வு" }, { "roman": "ulakaviṭaikaḻi", "word": "உலகவிடைகழி" }, { "roman": "ulakaviyāpāram", "word": "உலகவியாபாரம்" }, { "roman": "ulakaviruttam", "word": "உலகவிருத்தம்" }, { "roman": "ulakavēṭaṇai", "word": "உலகவேடணை" }, { "roman": "ulakikam", "word": "உலகிகம்" }, { "roman": "ulakitaṉ", "word": "உலகிதன்" }, { "roman": "ulakiyaṟcol", "word": "உலகியற்சொல்" }, { "roman": "ulakiyal", "word": "உலகியல்" }, { "roman": "ulakiyalvaḻakku", "word": "உலகியல்வழக்கு" }, { "roman": "ulakuṭaiya perumāḷ", "word": "உலகுடைய பெருமாள்" }, { "roman": "ulakēṭaṇai", "word": "உலகேடணை" }, { "roman": "ēḻulakam", "word": "ஏழுலகம்" }, { "roman": "kīḻulaku", "word": "கீழுலகு" }, { "roman": "cellulaku", "word": "செல்லுலகு" }, { "roman": "nilavulakam", "word": "நிலவுலகம்" }, { "roman": "pūvulaku", "word": "பூவுலகு" }, { "roman": "maṇṇulaku", "word": "மண்ணுலகு" }, { "roman": "mēlulakam", "word": "மேலுலகம்" }, { "roman": "mēlaiyulaku", "word": "மேலையுலகு" } ], "etymology_templates": [ { "args": { "1": "ta", "2": "sa", "3": "लोक" }, "expansion": "Borrowed from Sanskrit लोक (loka)", "name": "bor+" }, { "args": { "1": "ta", "2": "லோகம்" }, "expansion": "Doublet of லோகம் (lōkam)", "name": "dbt" } ], "etymology_text": "Borrowed from Sanskrit लोक (loka). Doublet of லோகம் (lōkam).", "forms": [ { "form": "ulakam", "tags": [ "romanization" ] }, { "form": "no-table-tags", "source": "declension", "tags": [ "table-tags" ] }, { "form": "ta-decl", "source": "declension", "tags": [ "inflection-template" ] }, { "form": "m-stem", "source": "declension", "tags": [ "class" ] }, { "form": "உலகம்", "roman": "ulakam", "source": "declension", "tags": [ "nominative", "singular" ] }, { "form": "உலகங்கள்", "roman": "ulakaṅkaḷ", "source": "declension", "tags": [ "nominative", "plural" ] }, { "form": "உலகமே", "roman": "ulakamē", "source": "declension", "tags": [ "singular", "vocative" ] }, { "form": "உலகங்களே", "roman": "ulakaṅkaḷē", "source": "declension", "tags": [ "plural", "vocative" ] }, { "form": "உலகத்தை", "roman": "ulakattai", "source": "declension", "tags": [ "accusative", "singular" ] }, { "form": "உலகங்களை", "roman": "ulakaṅkaḷai", "source": "declension", "tags": [ "accusative", "plural" ] }, { "form": "உலகத்துக்கு", "roman": "ulakattukku", "source": "declension", "tags": [ "dative", "singular" ] }, { "form": "உலகங்களுக்கு", "roman": "ulakaṅkaḷukku", "source": "declension", "tags": [ "dative", "plural" ] }, { "form": "உலகத்துக்காக", "roman": "ulakattukkāka", "source": "declension", "tags": [ "benefactive", "singular" ] }, { "form": "உலகங்களுக்காக", "roman": "ulakaṅkaḷukkāka", "source": "declension", "tags": [ "benefactive", "plural" ] }, { "form": "உலகத்துடைய", "roman": "ulakattuṭaiya", "source": "declension", "tags": [ "genitive", "genitive-i", "singular" ] }, { "form": "உலகங்களுடைய", "roman": "ulakaṅkaḷuṭaiya", "source": "declension", "tags": [ "genitive", "genitive-i", "plural" ] }, { "form": "உலகத்தின்", "roman": "ulakattiṉ", "source": "declension", "tags": [ "genitive", "genitive-ii", "singular" ] }, { "form": "உலகங்களின்", "roman": "ulakaṅkaḷiṉ", "source": "declension", "tags": [ "genitive", "genitive-ii", "plural" ] }, { "form": "உலகத்தில்", "roman": "ulakattil", "source": "declension", "tags": [ "locative", "locative-i", "singular" ] }, { "form": "உலகங்களில்", "roman": "ulakaṅkaḷil", "source": "declension", "tags": [ "locative", "locative-i", "plural" ] }, { "form": "உலகத்திடம்", "roman": "ulakattiṭam", "source": "declension", "tags": [ "locative", "locative-ii", "singular" ] }, { "form": "உலகங்களிடம்", "roman": "ulakaṅkaḷiṭam", "source": "declension", "tags": [ "locative", "locative-ii", "plural" ] }, { "form": "உலகத்தோடு", "roman": "ulakattōṭu", "source": "declension", "tags": [ "singular", "sociative", "sociative-i" ] }, { "form": "உலகங்களோடு", "roman": "ulakaṅkaḷōṭu", "source": "declension", "tags": [ "plural", "sociative", "sociative-i" ] }, { "form": "உலகத்துடன்", "roman": "ulakattuṭaṉ", "source": "declension", "tags": [ "singular", "sociative", "sociative-ii" ] }, { "form": "உலகங்களுடன்", "roman": "ulakaṅkaḷuṭaṉ", "source": "declension", "tags": [ "plural", "sociative", "sociative-ii" ] }, { "form": "உலகத்தால்", "roman": "ulakattāl", "source": "declension", "tags": [ "instrumental", "singular" ] }, { "form": "உலகங்களால்", "roman": "ulakaṅkaḷāl", "source": "declension", "tags": [ "instrumental", "plural" ] }, { "form": "உலகத்திலிருந்து", "roman": "ulakattiliruntu", "source": "declension", "tags": [ "ablative", "singular" ] }, { "form": "உலகங்களிலிருந்து", "roman": "ulakaṅkaḷiliruntu", "source": "declension", "tags": [ "ablative", "plural" ] } ], "head_templates": [ { "args": { "tr": "ulakam" }, "expansion": "உலகம் • (ulakam)", "name": "ta-noun" } ], "inflection_templates": [ { "args": {}, "name": "ta-decl" } ], "lang": "Tamil", "lang_code": "ta", "pos": "noun", "senses": [ { "glosses": [ "world, earth" ], "links": [ [ "world", "world" ], [ "earth", "earth" ] ], "synonyms": [ { "word": "உலகம்" } ] }, { "glosses": [ "planet" ], "links": [ [ "planet", "planet" ] ], "synonyms": [ { "word": "கோள்" }, { "word": "கிரகம்" } ] } ], "sounds": [ { "ipa": "/ʊlɐɡɐm/" } ], "synonyms": [ { "source": "Thesaurus:உலகம்", "word": "பார்" }, { "source": "Thesaurus:உலகம்", "word": "ஞாலம்" }, { "source": "Thesaurus:உலகம்", "word": "ஜகம்" }, { "source": "Thesaurus:உலகம்", "word": "வையகம்" }, { "source": "Thesaurus:உலகம்", "word": "பூமி" }, { "source": "Thesaurus:உலகம்", "word": "உலகம்" }, { "source": "Thesaurus:உலகம்", "word": "அண்டம்" }, { "source": "Thesaurus:உலகம்", "word": "லோகம்" }, { "source": "Thesaurus:உலகம்", "word": "அகிலம்" }, { "source": "Thesaurus:உலகம்", "word": "அவனி" }, { "source": "Thesaurus:உலகம்", "word": "தரணி" }, { "source": "Thesaurus:உலகம்", "word": "காசினி" }, { "source": "Thesaurus:உலகம்", "word": "மேதினி" }, { "source": "Thesaurus:உலகம்", "word": "புவி" }, { "source": "Thesaurus:உலகம்", "word": "ஊழி" } ], "word": "உலகம்" }
Download raw JSONL data for உலகம் meaning in Tamil (9.3kB)
This page is a part of the kaikki.org machine-readable Tamil dictionary. This dictionary is based on structured data extracted on 2024-12-15 from the enwiktionary dump dated 2024-12-04 using wiktextract (8a39820 and 4401a4c). The data shown on this site has been post-processed and various details (e.g., extra categories) removed, some information disambiguated, and additional data merged from other sources. See the raw data download page for the unprocessed wiktextract data.
If you use this data in academic research, please cite Tatu Ylonen: Wiktextract: Wiktionary as Machine-Readable Structured Data, Proceedings of the 13th Conference on Language Resources and Evaluation (LREC), pp. 1317-1325, Marseille, 20-25 June 2022. Linking to the relevant page(s) under https://kaikki.org would also be greatly appreciated.