See sorex in All languages combined, or Wiktionary
{ "derived": [ { "_dis1": "0 0", "word": "sōricīnus" } ], "descendants": [ { "depth": 1, "templates": [], "text": "Balkan Romance:" }, { "depth": 2, "templates": [ { "args": { "1": "rup", "2": "shoaric", "3": "shorãc" }, "expansion": "Aromanian: shoaric, shorãc", "name": "desc" } ], "text": "Aromanian: shoaric, shorãc" }, { "depth": 2, "templates": [ { "args": { "1": "ro", "2": "șoarece", "3": "șoarec" }, "expansion": "Romanian: șoarece, șoarec", "name": "desc" } ], "text": "Romanian: șoarece, șoarec" }, { "depth": 1, "templates": [], "text": "Dalmatian:" }, { "depth": 2, "templates": [ { "args": { "1": "dlm", "2": "surco", "nolb": "1" }, "expansion": "surco", "name": "desc" } ], "text": "surco" }, { "depth": 1, "templates": [], "text": "Italo-Romance:" }, { "depth": 2, "templates": [ { "args": { "1": "it", "2": "sorcio", "3": "sorice" }, "expansion": "Italian: sorcio, sorice", "name": "desc" }, { "args": { "1": "archaic" }, "expansion": "(archaic)", "name": "q" }, { "args": { "1": "Marche" }, "expansion": "(Marche)", "name": "q" } ], "text": "Italian: sorcio, sorice (archaic), sorca, sorga (Marche)" }, { "depth": 2, "templates": [ { "args": { "1": "nap", "2": "sorece" }, "expansion": "Neapolitan: sorece", "name": "desc" } ], "text": "Neapolitan: sorece" }, { "depth": 2, "templates": [ { "args": { "1": "scn", "2": "surci", "3": "sùrici" }, "expansion": "Sicilian: surci, sùrici", "name": "desc" } ], "text": "Sicilian: surci, sùrici" }, { "depth": 1, "templates": [], "text": "North Italian:" }, { "depth": 2, "templates": [ { "args": { "1": "fur", "2": "surîs" }, "expansion": "Friulian: surîs", "name": "desc" } ], "text": "Friulian: surîs" }, { "depth": 2, "templates": [ { "args": { "1": "lmo", "2": "sorec" }, "expansion": "Lombard: sorec", "name": "desc" } ], "text": "Lombard: sorec" }, { "depth": 2, "templates": [ { "args": { "1": "rm", "2": "schuorsch" }, "expansion": "Romansch: schuorsch", "name": "desc" } ], "text": "Romansch: schuorsch" }, { "depth": 2, "templates": [ { "args": { "1": "vec", "2": "sorxe" }, "expansion": "Venetan: sorxe", "name": "desc" } ], "text": "Venetan: sorxe" }, { "depth": 1, "templates": [], "text": "Gallo-Romance:" }, { "depth": 2, "templates": [ { "args": { "1": "fro", "2": "soris" }, "expansion": "Old French: soris", "name": "desc" } ], "text": "Old French: soris" }, { "depth": 3, "templates": [ { "args": { "1": "fr", "2": "souris" }, "expansion": "French: souris\nMichif: soorii", "name": "desctree" } ], "text": "French: souris\nMichif: soorii" }, { "depth": 3, "templates": [ { "args": { "1": "nrf", "2": "souoris" }, "expansion": "Norman: souoris", "name": "desc" } ], "text": "Norman: souoris" }, { "depth": 3, "templates": [ { "args": { "1": "pcd" }, "expansion": "Picard:", "name": "desc" } ], "text": "Picard:" }, { "depth": 3, "templates": [ { "args": { "1": "pcd", "2": "suris", "nolb": "1" }, "expansion": "suris", "name": "desc" } ], "text": "Northern: suris" }, { "depth": 3, "templates": [ { "args": { "1": "pcd", "2": "seris", "3": "seuris", "4": "soiris", "nolb": "1" }, "expansion": "seris, seuris, soiris", "name": "desc" } ], "text": "Southern: seris, seuris, soiris" }, { "depth": 3, "templates": [ { "args": { "1": "roa-poi", "2": "sourit", "der": "1" }, "expansion": "⇒ Poitevin-Saintongeais: sourit", "name": "desc" } ], "text": "⇒ Poitevin-Saintongeais: sourit" }, { "depth": 3, "templates": [ { "args": { "1": "wa", "2": "soris" }, "expansion": "Walloon: soris", "name": "desc" } ], "text": "Walloon: soris" }, { "depth": 1, "templates": [], "text": "West Iberian:" }, { "depth": 2, "templates": [ { "args": { "1": "osp", "2": "sorze" }, "expansion": "Old Spanish: sorze", "name": "desc" } ], "text": "Old Spanish: sorze" }, { "depth": 3, "templates": [ { "args": { "1": "es", "2": "sorce" }, "expansion": "Spanish: sorce", "name": "desc" } ], "text": "Spanish: sorce" }, { "depth": 1, "templates": [], "text": "Insular Romance:" }, { "depth": 2, "templates": [ { "args": { "1": "sc" }, "expansion": "Sardinian:", "name": "desc" } ], "text": "Sardinian:" }, { "depth": 3, "templates": [ { "args": { "1": "sc-src", "2": "sorighe" }, "expansion": "Logudorese: sorighe", "name": "desc" } ], "text": "Logudorese: sorighe" }, { "depth": 3, "templates": [ { "args": { "1": "sc-nuo", "2": "soriche" }, "expansion": "Nuorese: soriche", "name": "desc" } ], "text": "Nuorese: soriche" }, { "depth": 1, "templates": [ { "args": { "1": "Sorex", "2": "genus" }, "expansion": "Sorex", "name": "taxfmt" } ], "text": "Translingual: Sorex" }, { "depth": 1, "templates": [], "text": "Various derived terms meaning 'bat':" }, { "depth": 2, "templates": [ { "args": { "1": "dlm", "2": "surca pizigaun", "3": "surca pitsigaun", "der": "1" }, "expansion": "⇒ Dalmatian: surca pizigaun, surca pitsigaun", "name": "desc" } ], "text": "⇒ Dalmatian: surca pizigaun, surca pitsigaun" }, { "depth": 2, "templates": [ { "args": { "1": "fr", "2": "chauvesouris", "der": "1" }, "expansion": "⇒ French: chauvesouris", "name": "desc" } ], "text": "⇒ French: chauvesouris" }, { "depth": 2, "templates": [ { "args": { "1": "oc", "2": "soritz pennada", "der": "1" }, "expansion": "⇒ Occitan: soritz pennada", "name": "desc" } ], "text": "⇒ Occitan: soritz pennada" }, { "depth": 2, "templates": [ { "args": { "1": "sc", "2": "sorighe pinnadulu", "der": "1" }, "expansion": "⇒ Sardinian: sorighe pinnadulu", "name": "desc" } ], "text": "⇒ Sardinian: sorighe pinnadulu" }, { "depth": 2, "templates": [ { "args": { "1": "scn", "2": "suriğe ulateu", "3": "sorici occelli", "der": "1" }, "expansion": "⇒ Sicilian: suriğe ulateu, sorici occelli", "name": "desc" }, { "args": { "1": "Calabria" }, "expansion": "(Calabria)", "name": "q" } ], "text": "⇒ Sicilian: suriğe ulateu, sorici occelli (Calabria)" } ], "etymology_templates": [ { "args": { "1": "la" }, "expansion": "Uncertain", "name": "unc" }, { "args": { "1": "la", "2": "grc", "3": "ὕραξ", "4": "", "5": "shrewmouse" }, "expansion": "Ancient Greek ὕραξ (húrax, “shrewmouse”)", "name": "der" } ], "etymology_text": "Uncertain; possibly related to susurrus (“whisper, rustling”), or Ancient Greek ὕραξ (húrax, “shrewmouse”).", "forms": [ { "form": "sōrex", "tags": [ "canonical", "masculine" ] }, { "form": "sōricis", "tags": [ "genitive" ] }, { "form": "no-table-tags", "source": "declension", "tags": [ "table-tags" ] }, { "form": "la-ndecl", "source": "declension", "tags": [ "inflection-template" ] }, { "form": "sōrex", "source": "declension", "tags": [ "nominative", "singular" ] }, { "form": "sōricēs", "source": "declension", "tags": [ "nominative", "plural" ] }, { "form": "sōricis", "source": "declension", "tags": [ "genitive", "singular" ] }, { "form": "sōricum", "source": "declension", "tags": [ "genitive", "plural" ] }, { "form": "sōricī", "source": "declension", "tags": [ "dative", "singular" ] }, { "form": "sōricibus", "source": "declension", "tags": [ "dative", "plural" ] }, { "form": "sōricem", "source": "declension", "tags": [ "accusative", "singular" ] }, { "form": "sōricēs", "source": "declension", "tags": [ "accusative", "plural" ] }, { "form": "sōrice", "source": "declension", "tags": [ "ablative", "singular" ] }, { "form": "sōricibus", "source": "declension", "tags": [ "ablative", "plural" ] }, { "form": "sōrex", "source": "declension", "tags": [ "singular", "vocative" ] }, { "form": "sōricēs", "source": "declension", "tags": [ "plural", "vocative" ] } ], "head_templates": [ { "args": { "1": "sōrex<3>", "g": "m" }, "expansion": "sōrex m (genitive sōricis); third declension", "name": "la-noun" } ], "inflection_templates": [ { "args": { "1": "sōrex<3>" }, "name": "la-ndecl" } ], "lang": "Latin", "lang_code": "la", "pos": "noun", "senses": [ { "categories": [ { "_dis": "46 54", "kind": "other", "name": "Latin entries with incorrect language header", "parents": [ "Entries with incorrect language header", "Entry maintenance" ], "source": "w+disamb" }, { "_dis": "46 54", "kind": "other", "name": "Pages with 1 entry", "parents": [], "source": "w+disamb" }, { "_dis": "46 54", "kind": "other", "name": "Pages with entries", "parents": [], "source": "w+disamb" }, { "_dis": "47 53", "kind": "lifeform", "langcode": "la", "name": "Rodents", "orig": "la:Rodents", "parents": [ "Mammals", "Vertebrates", "Chordates", "Animals", "Lifeforms", "All topics", "Life", "Fundamental", "Nature" ], "source": "w+disamb" }, { "_dis": "50 50", "kind": "lifeform", "langcode": "la", "name": "Soricomorphs", "orig": "la:Soricomorphs", "parents": [ "Mammals", "Vertebrates", "Chordates", "Animals", "Lifeforms", "All topics", "Life", "Fundamental", "Nature" ], "source": "w+disamb" } ], "glosses": [ "shrew, shrewmouse" ], "id": "en-sorex-la-noun-pPiPS~mC", "links": [ [ "shrew", "shrew" ], [ "shrewmouse", "shrewmouse" ] ], "tags": [ "declension-3" ] }, { "categories": [ { "kind": "other", "name": "Late Latin", "parents": [], "source": "w" }, { "kind": "other", "name": "Medieval Latin", "parents": [], "source": "w" }, { "_dis": "46 54", "kind": "other", "name": "Latin entries with incorrect language header", "parents": [ "Entries with incorrect language header", "Entry maintenance" ], "source": "w+disamb" }, { "_dis": "35 65", "kind": "other", "name": "Latin masculine nouns in the third declension", "parents": [], "source": "w+disamb" }, { "_dis": "46 54", "kind": "other", "name": "Pages with 1 entry", "parents": [], "source": "w+disamb" }, { "_dis": "46 54", "kind": "other", "name": "Pages with entries", "parents": [], "source": "w+disamb" }, { "_dis": "47 53", "kind": "lifeform", "langcode": "la", "name": "Rodents", "orig": "la:Rodents", "parents": [ "Mammals", "Vertebrates", "Chordates", "Animals", "Lifeforms", "All topics", "Life", "Fundamental", "Nature" ], "source": "w+disamb" }, { "_dis": "50 50", "kind": "lifeform", "langcode": "la", "name": "Soricomorphs", "orig": "la:Soricomorphs", "parents": [ "Mammals", "Vertebrates", "Chordates", "Animals", "Lifeforms", "All topics", "Life", "Fundamental", "Nature" ], "source": "w+disamb" } ], "glosses": [ "mouse" ], "id": "en-sorex-la-noun-R8XCjK4l", "links": [ [ "mouse", "mouse" ] ], "raw_glosses": [ "(Late Latin, Medieval Latin) mouse" ], "tags": [ "Late-Latin", "Medieval-Latin", "declension-3" ] } ], "sounds": [ { "ipa": "/ˈsoː.reks/", "tags": [ "Classical-Latin" ] }, { "ipa": "[ˈs̠oːrɛks̠]", "tags": [ "Classical-Latin" ] }, { "ipa": "/ˈso.reks/", "note": "modern Italianate Ecclesiastical" }, { "ipa": "[ˈsɔːreks]", "note": "modern Italianate Ecclesiastical" }, { "ipa": "/ˈso.reks/", "tags": [ "Classical-Latin" ] }, { "ipa": "[ˈs̠ɔrɛks̠]", "tags": [ "Classical-Latin" ] }, { "ipa": "/ˈso.reks/", "note": "modern Italianate Ecclesiastical" }, { "ipa": "[ˈsɔːreks]", "note": "modern Italianate Ecclesiastical" } ], "word": "sorex" }
{ "categories": [ "Latin 2-syllable words", "Latin entries with incorrect language header", "Latin lemmas", "Latin masculine nouns", "Latin masculine nouns in the third declension", "Latin nouns", "Latin terms derived from Ancient Greek", "Latin terms with IPA pronunciation", "Latin terms with unknown etymologies", "Latin third declension nouns", "Pages with 1 entry", "Pages with entries", "la:Rodents", "la:Soricomorphs" ], "derived": [ { "word": "sōricīnus" } ], "descendants": [ { "depth": 1, "templates": [], "text": "Balkan Romance:" }, { "depth": 2, "templates": [ { "args": { "1": "rup", "2": "shoaric", "3": "shorãc" }, "expansion": "Aromanian: shoaric, shorãc", "name": "desc" } ], "text": "Aromanian: shoaric, shorãc" }, { "depth": 2, "templates": [ { "args": { "1": "ro", "2": "șoarece", "3": "șoarec" }, "expansion": "Romanian: șoarece, șoarec", "name": "desc" } ], "text": "Romanian: șoarece, șoarec" }, { "depth": 1, "templates": [], "text": "Dalmatian:" }, { "depth": 2, "templates": [ { "args": { "1": "dlm", "2": "surco", "nolb": "1" }, "expansion": "surco", "name": "desc" } ], "text": "surco" }, { "depth": 1, "templates": [], "text": "Italo-Romance:" }, { "depth": 2, "templates": [ { "args": { "1": "it", "2": "sorcio", "3": "sorice" }, "expansion": "Italian: sorcio, sorice", "name": "desc" }, { "args": { "1": "archaic" }, "expansion": "(archaic)", "name": "q" }, { "args": { "1": "Marche" }, "expansion": "(Marche)", "name": "q" } ], "text": "Italian: sorcio, sorice (archaic), sorca, sorga (Marche)" }, { "depth": 2, "templates": [ { "args": { "1": "nap", "2": "sorece" }, "expansion": "Neapolitan: sorece", "name": "desc" } ], "text": "Neapolitan: sorece" }, { "depth": 2, "templates": [ { "args": { "1": "scn", "2": "surci", "3": "sùrici" }, "expansion": "Sicilian: surci, sùrici", "name": "desc" } ], "text": "Sicilian: surci, sùrici" }, { "depth": 1, "templates": [], "text": "North Italian:" }, { "depth": 2, "templates": [ { "args": { "1": "fur", "2": "surîs" }, "expansion": "Friulian: surîs", "name": "desc" } ], "text": "Friulian: surîs" }, { "depth": 2, "templates": [ { "args": { "1": "lmo", "2": "sorec" }, "expansion": "Lombard: sorec", "name": "desc" } ], "text": "Lombard: sorec" }, { "depth": 2, "templates": [ { "args": { "1": "rm", "2": "schuorsch" }, "expansion": "Romansch: schuorsch", "name": "desc" } ], "text": "Romansch: schuorsch" }, { "depth": 2, "templates": [ { "args": { "1": "vec", "2": "sorxe" }, "expansion": "Venetan: sorxe", "name": "desc" } ], "text": "Venetan: sorxe" }, { "depth": 1, "templates": [], "text": "Gallo-Romance:" }, { "depth": 2, "templates": [ { "args": { "1": "fro", "2": "soris" }, "expansion": "Old French: soris", "name": "desc" } ], "text": "Old French: soris" }, { "depth": 3, "templates": [ { "args": { "1": "fr", "2": "souris" }, "expansion": "French: souris\nMichif: soorii", "name": "desctree" } ], "text": "French: souris\nMichif: soorii" }, { "depth": 3, "templates": [ { "args": { "1": "nrf", "2": "souoris" }, "expansion": "Norman: souoris", "name": "desc" } ], "text": "Norman: souoris" }, { "depth": 3, "templates": [ { "args": { "1": "pcd" }, "expansion": "Picard:", "name": "desc" } ], "text": "Picard:" }, { "depth": 3, "templates": [ { "args": { "1": "pcd", "2": "suris", "nolb": "1" }, "expansion": "suris", "name": "desc" } ], "text": "Northern: suris" }, { "depth": 3, "templates": [ { "args": { "1": "pcd", "2": "seris", "3": "seuris", "4": "soiris", "nolb": "1" }, "expansion": "seris, seuris, soiris", "name": "desc" } ], "text": "Southern: seris, seuris, soiris" }, { "depth": 3, "templates": [ { "args": { "1": "roa-poi", "2": "sourit", "der": "1" }, "expansion": "⇒ Poitevin-Saintongeais: sourit", "name": "desc" } ], "text": "⇒ Poitevin-Saintongeais: sourit" }, { "depth": 3, "templates": [ { "args": { "1": "wa", "2": "soris" }, "expansion": "Walloon: soris", "name": "desc" } ], "text": "Walloon: soris" }, { "depth": 1, "templates": [], "text": "West Iberian:" }, { "depth": 2, "templates": [ { "args": { "1": "osp", "2": "sorze" }, "expansion": "Old Spanish: sorze", "name": "desc" } ], "text": "Old Spanish: sorze" }, { "depth": 3, "templates": [ { "args": { "1": "es", "2": "sorce" }, "expansion": "Spanish: sorce", "name": "desc" } ], "text": "Spanish: sorce" }, { "depth": 1, "templates": [], "text": "Insular Romance:" }, { "depth": 2, "templates": [ { "args": { "1": "sc" }, "expansion": "Sardinian:", "name": "desc" } ], "text": "Sardinian:" }, { "depth": 3, "templates": [ { "args": { "1": "sc-src", "2": "sorighe" }, "expansion": "Logudorese: sorighe", "name": "desc" } ], "text": "Logudorese: sorighe" }, { "depth": 3, "templates": [ { "args": { "1": "sc-nuo", "2": "soriche" }, "expansion": "Nuorese: soriche", "name": "desc" } ], "text": "Nuorese: soriche" }, { "depth": 1, "templates": [ { "args": { "1": "Sorex", "2": "genus" }, "expansion": "Sorex", "name": "taxfmt" } ], "text": "Translingual: Sorex" }, { "depth": 1, "templates": [], "text": "Various derived terms meaning 'bat':" }, { "depth": 2, "templates": [ { "args": { "1": "dlm", "2": "surca pizigaun", "3": "surca pitsigaun", "der": "1" }, "expansion": "⇒ Dalmatian: surca pizigaun, surca pitsigaun", "name": "desc" } ], "text": "⇒ Dalmatian: surca pizigaun, surca pitsigaun" }, { "depth": 2, "templates": [ { "args": { "1": "fr", "2": "chauvesouris", "der": "1" }, "expansion": "⇒ French: chauvesouris", "name": "desc" } ], "text": "⇒ French: chauvesouris" }, { "depth": 2, "templates": [ { "args": { "1": "oc", "2": "soritz pennada", "der": "1" }, "expansion": "⇒ Occitan: soritz pennada", "name": "desc" } ], "text": "⇒ Occitan: soritz pennada" }, { "depth": 2, "templates": [ { "args": { "1": "sc", "2": "sorighe pinnadulu", "der": "1" }, "expansion": "⇒ Sardinian: sorighe pinnadulu", "name": "desc" } ], "text": "⇒ Sardinian: sorighe pinnadulu" }, { "depth": 2, "templates": [ { "args": { "1": "scn", "2": "suriğe ulateu", "3": "sorici occelli", "der": "1" }, "expansion": "⇒ Sicilian: suriğe ulateu, sorici occelli", "name": "desc" }, { "args": { "1": "Calabria" }, "expansion": "(Calabria)", "name": "q" } ], "text": "⇒ Sicilian: suriğe ulateu, sorici occelli (Calabria)" } ], "etymology_templates": [ { "args": { "1": "la" }, "expansion": "Uncertain", "name": "unc" }, { "args": { "1": "la", "2": "grc", "3": "ὕραξ", "4": "", "5": "shrewmouse" }, "expansion": "Ancient Greek ὕραξ (húrax, “shrewmouse”)", "name": "der" } ], "etymology_text": "Uncertain; possibly related to susurrus (“whisper, rustling”), or Ancient Greek ὕραξ (húrax, “shrewmouse”).", "forms": [ { "form": "sōrex", "tags": [ "canonical", "masculine" ] }, { "form": "sōricis", "tags": [ "genitive" ] }, { "form": "no-table-tags", "source": "declension", "tags": [ "table-tags" ] }, { "form": "la-ndecl", "source": "declension", "tags": [ "inflection-template" ] }, { "form": "sōrex", "source": "declension", "tags": [ "nominative", "singular" ] }, { "form": "sōricēs", "source": "declension", "tags": [ "nominative", "plural" ] }, { "form": "sōricis", "source": "declension", "tags": [ "genitive", "singular" ] }, { "form": "sōricum", "source": "declension", "tags": [ "genitive", "plural" ] }, { "form": "sōricī", "source": "declension", "tags": [ "dative", "singular" ] }, { "form": "sōricibus", "source": "declension", "tags": [ "dative", "plural" ] }, { "form": "sōricem", "source": "declension", "tags": [ "accusative", "singular" ] }, { "form": "sōricēs", "source": "declension", "tags": [ "accusative", "plural" ] }, { "form": "sōrice", "source": "declension", "tags": [ "ablative", "singular" ] }, { "form": "sōricibus", "source": "declension", "tags": [ "ablative", "plural" ] }, { "form": "sōrex", "source": "declension", "tags": [ "singular", "vocative" ] }, { "form": "sōricēs", "source": "declension", "tags": [ "plural", "vocative" ] } ], "head_templates": [ { "args": { "1": "sōrex<3>", "g": "m" }, "expansion": "sōrex m (genitive sōricis); third declension", "name": "la-noun" } ], "inflection_templates": [ { "args": { "1": "sōrex<3>" }, "name": "la-ndecl" } ], "lang": "Latin", "lang_code": "la", "pos": "noun", "senses": [ { "glosses": [ "shrew, shrewmouse" ], "links": [ [ "shrew", "shrew" ], [ "shrewmouse", "shrewmouse" ] ], "tags": [ "declension-3" ] }, { "categories": [ "Late Latin", "Medieval Latin" ], "glosses": [ "mouse" ], "links": [ [ "mouse", "mouse" ] ], "raw_glosses": [ "(Late Latin, Medieval Latin) mouse" ], "tags": [ "Late-Latin", "Medieval-Latin", "declension-3" ] } ], "sounds": [ { "ipa": "/ˈsoː.reks/", "tags": [ "Classical-Latin" ] }, { "ipa": "[ˈs̠oːrɛks̠]", "tags": [ "Classical-Latin" ] }, { "ipa": "/ˈso.reks/", "note": "modern Italianate Ecclesiastical" }, { "ipa": "[ˈsɔːreks]", "note": "modern Italianate Ecclesiastical" }, { "ipa": "/ˈso.reks/", "tags": [ "Classical-Latin" ] }, { "ipa": "[ˈs̠ɔrɛks̠]", "tags": [ "Classical-Latin" ] }, { "ipa": "/ˈso.reks/", "note": "modern Italianate Ecclesiastical" }, { "ipa": "[ˈsɔːreks]", "note": "modern Italianate Ecclesiastical" } ], "word": "sorex" }
Download raw JSONL data for sorex meaning in Latin (8.5kB)
This page is a part of the kaikki.org machine-readable Latin dictionary. This dictionary is based on structured data extracted on 2024-12-21 from the enwiktionary dump dated 2024-12-04 using wiktextract (d8cb2f3 and 4e554ae). The data shown on this site has been post-processed and various details (e.g., extra categories) removed, some information disambiguated, and additional data merged from other sources. See the raw data download page for the unprocessed wiktextract data.
If you use this data in academic research, please cite Tatu Ylonen: Wiktextract: Wiktionary as Machine-Readable Structured Data, Proceedings of the 13th Conference on Language Resources and Evaluation (LREC), pp. 1317-1325, Marseille, 20-25 June 2022. Linking to the relevant page(s) under https://kaikki.org would also be greatly appreciated.