See sarïmsak in All languages combined, or Wiktionary
{ "descendants": [ { "depth": 1, "templates": [ { "args": { "1": "xqa", "2": "سَرْمُسَقْ", "3": "سَرُمْسَقْ", "4": "سَمُرْسَقْ", "tr": "sarmusaq", "tr2": "sarumsaq", "tr3": "samursaq" }, "expansion": "Karakhanid: سَرْمُسَقْ (sarmusaq), سَرُمْسَقْ (sarumsaq), سَمُرْسَقْ (samursaq)", "name": "desc" } ], "text": "Karakhanid: سَرْمُسَقْ (sarmusaq), سَرُمْسَقْ (sarumsaq), سَمُرْسَقْ (samursaq)" }, { "depth": 1, "templates": [], "text": "Oghuz" }, { "depth": 2, "templates": [], "text": "West Oghuz" }, { "depth": 3, "templates": [ { "args": { "1": "az", "2": "sarımsaq" }, "expansion": "Azerbaijani: sarımsaq", "name": "desc" } ], "text": "Azerbaijani: sarımsaq" }, { "depth": 3, "templates": [ { "args": { "1": "gag", "2": "sarmısak" }, "expansion": "Gagauz: sarmısak", "name": "desc" } ], "text": "Gagauz: sarmısak" }, { "depth": 3, "templates": [ { "args": { "1": "ota", "2": "صارمساق", "tr": "sarımsaq" }, "expansion": "Ottoman Turkish: صارمساق (sarımsaq)", "name": "desc" } ], "text": "Ottoman Turkish: صارمساق (sarımsaq)" }, { "depth": 4, "templates": [ { "args": { "1": "tr", "2": "sarmısak", "3": "sarımsak", "4": "samırsak" }, "expansion": "Turkish: sarmısak, sarımsak, samırsak", "name": "desc" } ], "text": "Turkish: sarmısak, sarımsak, samırsak" }, { "depth": 2, "templates": [], "text": "East Oghuz" }, { "depth": 3, "templates": [ { "args": { "1": "tk", "2": "sarymsak" }, "expansion": "Turkmen: sarymsak", "name": "desc" } ], "text": "Turkmen: sarymsak" }, { "depth": 1, "templates": [], "text": "Kipchak" }, { "depth": 2, "templates": [], "text": "West Kipchak" }, { "depth": 3, "templates": [ { "args": { "1": "krc", "2": "сарсмакъ", "3": "сарымсах", "tr": "sarsmaq", "tr2": "sarımsax" }, "expansion": "Karachay-Balkar: сарсмакъ (sarsmaq), сарымсах (sarımsax)", "name": "desc" } ], "text": "Karachay-Balkar: сарсмакъ (sarsmaq), сарымсах (sarımsax)" }, { "depth": 3, "templates": [ { "args": { "1": "kum", "2": "самурсакъ", "tr": "samursaq" }, "expansion": "Kumyk: самурсакъ (samursaq)", "name": "desc" } ], "text": "Kumyk: самурсакъ (samursaq)" }, { "depth": 2, "templates": [], "text": "North Kipchak" }, { "depth": 3, "templates": [ { "args": { "1": "ba", "2": "һарымһаҡ" }, "expansion": "Bashkir: һарымһаҡ (harımhaq)", "name": "desc" } ], "text": "Bashkir: һарымһаҡ (harımhaq)" }, { "depth": 3, "templates": [ { "args": { "1": "tt", "2": "сарымсак" }, "expansion": "Tatar: сарымсак (sarımsaq)", "name": "desc" } ], "text": "Tatar: сарымсак (sarımsaq)" }, { "depth": 2, "templates": [], "text": "South Kipchak" }, { "depth": 3, "templates": [], "text": "Caspian" }, { "depth": 4, "templates": [ { "args": { "1": "kk", "2": "сарымсақ" }, "expansion": "Kazakh: сарымсақ (sarymsaq)", "name": "desc" } ], "text": "Kazakh: сарымсақ (sarymsaq)" }, { "depth": 4, "templates": [], "text": "Karakalpak sarımsaq" }, { "depth": 3, "templates": [], "text": "Kyrgyz-Kipchak" }, { "depth": 4, "templates": [ { "args": { "1": "ky", "2": "сарымсак" }, "expansion": "Kyrgyz: сарымсак (sarımsak)", "name": "desc" } ], "text": "Kyrgyz: сарымсак (sarımsak)" }, { "depth": 4, "templates": [ { "args": { "1": "alt", "2": "сарымсак" }, "expansion": "Southern Altai: сарымсак (sarïmsak)", "name": "desc" } ], "text": "Southern Altai: сарымсак (sarïmsak) (dialectal)" }, { "depth": 1, "templates": [], "text": "Karluk:" }, { "depth": 2, "templates": [ { "args": { "1": "chg", "2": "ساریمساق", "tr": "sarımsaq" }, "expansion": "Chagatai: ساریمساق (sarımsaq)", "name": "desc" } ], "text": "Chagatai: ساریمساق (sarımsaq)" }, { "depth": 3, "templates": [ { "args": { "1": "uz", "2": "sarimsoq" }, "expansion": "Uzbek: sarimsoq", "name": "desc" } ], "text": "Uzbek: sarimsoq" }, { "depth": 3, "templates": [ { "args": { "1": "ug", "2": "سامساق" }, "expansion": "Uyghur: سامساق (samsaq)", "name": "desc" } ], "text": "Uyghur: سامساق (samsaq)" }, { "depth": 1, "templates": [ { "args": { "1": "xgn-pro", "2": "*sarïmsag", "bor": "1" }, "expansion": "→ Proto-Mongolic: *sarïmsag", "name": "desc" } ], "text": "→ Proto-Mongolic: *sarïmsag" }, { "depth": 2, "templates": [ { "args": { "1": "sce", "2": "samusa" }, "expansion": "Dongxiang: samusa", "name": "desc" } ], "text": "Dongxiang: samusa" }, { "depth": 2, "templates": [ { "args": { "1": "mn", "2": "сармис", "alts": "1" }, "expansion": "Mongolian: сармис (sarmis), саримсаг (sarimsag), саримс (sarims)", "name": "desc" } ], "text": "Mongolian: сармис (sarmis), саримсаг (sarimsag), саримс (sarims)" } ], "etymology_templates": [ { "args": { "1": "trk-pro", "2": "ira" }, "expansion": "Iranian", "name": "bor" }, { "args": { "1": "cv", "2": "-" }, "expansion": "Chuvash", "name": "cog" }, { "args": { "1": "trk-sib", "2": "-" }, "expansion": "Siberian Turkic", "name": "cog" }, { "args": { "1": "fa", "2": "سیرمو", "tr": "sirmu" }, "expansion": "Persian سیرمو (sirmu)", "name": "cog" }, { "args": { "1": "kho", "tr": "sarme" }, "expansion": "Khotanese [script needed] (sarme)", "name": "cog" }, { "args": { "1": "sla-pro", "2": "*čermъša", "t": "ramsons" }, "expansion": "Proto-Slavic *čermъša (“ramsons”)", "name": "cog" }, { "args": { "1": "lt", "2": "kermùšė", "t": "ramsons" }, "expansion": "Lithuanian kermùšė (“ramsons”)", "name": "cog" }, { "args": { "1": "grc", "2": "κρόμμυον" }, "expansion": "Ancient Greek κρόμμυον (krómmuon)", "name": "cog" }, { "args": { "1": "gmw-pro", "2": "*hramusō", "t": "ramson" }, "expansion": "Proto-West Germanic *hramusō (“ramson”)", "name": "cog" }, { "args": { "1": "sga", "2": "crem", "t": "ramson" }, "expansion": "Old Irish crem (“ramson”)", "name": "cog" }, { "args": { "1": "ga", "2": "creamh" }, "expansion": "Irish creamh", "name": "cog" }, { "args": { "1": "xco", "tr": "-cyk" }, "expansion": "Khwarezmian [script needed] (-cyk)", "name": "cog" }, { "args": { "1": "sog", "tr": "-cyq" }, "expansion": "Sogdian [script needed] (-cyq)", "name": "cog" }, { "args": { "1": "hu", "2": "sárma" }, "expansion": "Hungarian sárma", "name": "cog" }, { "args": { "1": "hu", "2": "xln", "3": "-", "nocat": "1" }, "expansion": "Alanic", "name": "der" }, { "args": { "1": "trk", "2": "-" }, "expansion": "Turkic", "name": "cog" } ], "etymology_text": "Initially held to be derived from sarım (\"winding\"), which was later found phonetically and morphologically problematic. Another theory conceptualizes it after its yellowish-white root as a sarımsı (“yellowish, whitish” < sarı \"yellow\", from Proto-Turkic *sāryg (“yellow”), derived from the root *siar(ï)- originally preserving the primary meaning ‘white’ in Chuvash as шурӑ {šură}.\nAlternatively borrowed from Iranian, with the argument of the absence in Chuvash and Siberian Turkic. Found in Persian سیرمو (sirmu), سیر (sir, “garlic”), Khotanese [script needed] (sarme), [script needed] (sarmā, an eaten bulb of uncertain identification), doubtfully further connected to Proto-Slavic *čermъša (“ramsons”), Lithuanian kermùšė (“ramsons”), Ancient Greek κρόμμυον (krómmuon), Proto-West Germanic *hramusō (“ramson”), Old Irish crem (“ramson”) (Irish creamh). The suffix -sak (compare: -cik) of the Turkic word is depicted by Khwarezmian [script needed] (-cyk), Sogdian [script needed] (-cyq) that form the nisba adjective and noun. This suffix is recently held to be derived from the native form s(ı) + Old Turkic participle suffix ak or ç + diminutive suffix ak.\nHungarian sárma, meaning Ornithogalum species, which is of the same botanical order as garlic, is either an Alanic or a Turkic borrowing, observing also that in Turkic words which otherwise denote the garlic are used for Ornithogalum.", "forms": [ { "form": "no-table-tags", "source": "declension", "tags": [ "table-tags" ] }, { "form": "trk-pro-decl-noun", "source": "declension", "tags": [ "inflection-template" ] }, { "form": "sarïmsak", "source": "declension", "tags": [ "nominative", "singular" ] }, { "form": "sarïmsakïg", "source": "declension", "tags": [ "accusative", "singular" ] }, { "form": "sarïmsaknï", "source": "declension", "tags": [ "accusative", "singular" ] }, { "form": "sarïmsaknïŋ", "source": "declension", "tags": [ "genitive", "singular" ] }, { "form": "sarïmsakka", "source": "declension", "tags": [ "dative", "singular" ] }, { "form": "sarïmsakda", "source": "declension", "tags": [ "locative", "singular" ] }, { "form": "sarïmsakdan", "source": "declension", "tags": [ "ablative", "singular" ] }, { "form": "sarïmsakgaru", "source": "declension", "tags": [ "allative", "singular" ] }, { "form": "sarïmsakïn", "source": "declension", "tags": [ "instrumental", "singular" ] }, { "form": "sarïmsakča", "source": "declension", "tags": [ "equative", "singular" ] }, { "form": "sarïmsaklayu", "source": "declension", "tags": [ "error-unrecognized-form", "singular" ] }, { "form": "sarïmsaklïgu", "source": "declension", "tags": [ "comitative", "singular" ] } ], "head_templates": [ { "args": { "1": "trk-pro", "2": "noun" }, "expansion": "*sarïmsak", "name": "head" } ], "inflection_templates": [ { "args": { "1": "a" }, "name": "trk-pro-decl-noun" } ], "lang": "Proto-Turkic", "lang_code": "trk-pro", "original_title": "Reconstruction:Proto-Turkic/sarïmsak", "pos": "noun", "senses": [ { "categories": [ { "kind": "other", "name": "Pages with 1 entry", "parents": [], "source": "w" }, { "kind": "other", "name": "Pages with entries", "parents": [], "source": "w" }, { "kind": "other", "name": "Proto-Turkic entries with incorrect language header", "parents": [ "Entries with incorrect language header", "Entry maintenance" ], "source": "w" } ], "glosses": [ "garlic" ], "id": "en-sarïmsak-trk-pro-noun-QQJAhNLi", "links": [ [ "garlic", "garlic" ] ], "tags": [ "reconstruction" ] } ], "word": "sarïmsak" }
{ "descendants": [ { "depth": 1, "templates": [ { "args": { "1": "xqa", "2": "سَرْمُسَقْ", "3": "سَرُمْسَقْ", "4": "سَمُرْسَقْ", "tr": "sarmusaq", "tr2": "sarumsaq", "tr3": "samursaq" }, "expansion": "Karakhanid: سَرْمُسَقْ (sarmusaq), سَرُمْسَقْ (sarumsaq), سَمُرْسَقْ (samursaq)", "name": "desc" } ], "text": "Karakhanid: سَرْمُسَقْ (sarmusaq), سَرُمْسَقْ (sarumsaq), سَمُرْسَقْ (samursaq)" }, { "depth": 1, "templates": [], "text": "Oghuz" }, { "depth": 2, "templates": [], "text": "West Oghuz" }, { "depth": 3, "templates": [ { "args": { "1": "az", "2": "sarımsaq" }, "expansion": "Azerbaijani: sarımsaq", "name": "desc" } ], "text": "Azerbaijani: sarımsaq" }, { "depth": 3, "templates": [ { "args": { "1": "gag", "2": "sarmısak" }, "expansion": "Gagauz: sarmısak", "name": "desc" } ], "text": "Gagauz: sarmısak" }, { "depth": 3, "templates": [ { "args": { "1": "ota", "2": "صارمساق", "tr": "sarımsaq" }, "expansion": "Ottoman Turkish: صارمساق (sarımsaq)", "name": "desc" } ], "text": "Ottoman Turkish: صارمساق (sarımsaq)" }, { "depth": 4, "templates": [ { "args": { "1": "tr", "2": "sarmısak", "3": "sarımsak", "4": "samırsak" }, "expansion": "Turkish: sarmısak, sarımsak, samırsak", "name": "desc" } ], "text": "Turkish: sarmısak, sarımsak, samırsak" }, { "depth": 2, "templates": [], "text": "East Oghuz" }, { "depth": 3, "templates": [ { "args": { "1": "tk", "2": "sarymsak" }, "expansion": "Turkmen: sarymsak", "name": "desc" } ], "text": "Turkmen: sarymsak" }, { "depth": 1, "templates": [], "text": "Kipchak" }, { "depth": 2, "templates": [], "text": "West Kipchak" }, { "depth": 3, "templates": [ { "args": { "1": "krc", "2": "сарсмакъ", "3": "сарымсах", "tr": "sarsmaq", "tr2": "sarımsax" }, "expansion": "Karachay-Balkar: сарсмакъ (sarsmaq), сарымсах (sarımsax)", "name": "desc" } ], "text": "Karachay-Balkar: сарсмакъ (sarsmaq), сарымсах (sarımsax)" }, { "depth": 3, "templates": [ { "args": { "1": "kum", "2": "самурсакъ", "tr": "samursaq" }, "expansion": "Kumyk: самурсакъ (samursaq)", "name": "desc" } ], "text": "Kumyk: самурсакъ (samursaq)" }, { "depth": 2, "templates": [], "text": "North Kipchak" }, { "depth": 3, "templates": [ { "args": { "1": "ba", "2": "һарымһаҡ" }, "expansion": "Bashkir: һарымһаҡ (harımhaq)", "name": "desc" } ], "text": "Bashkir: һарымһаҡ (harımhaq)" }, { "depth": 3, "templates": [ { "args": { "1": "tt", "2": "сарымсак" }, "expansion": "Tatar: сарымсак (sarımsaq)", "name": "desc" } ], "text": "Tatar: сарымсак (sarımsaq)" }, { "depth": 2, "templates": [], "text": "South Kipchak" }, { "depth": 3, "templates": [], "text": "Caspian" }, { "depth": 4, "templates": [ { "args": { "1": "kk", "2": "сарымсақ" }, "expansion": "Kazakh: сарымсақ (sarymsaq)", "name": "desc" } ], "text": "Kazakh: сарымсақ (sarymsaq)" }, { "depth": 4, "templates": [], "text": "Karakalpak sarımsaq" }, { "depth": 3, "templates": [], "text": "Kyrgyz-Kipchak" }, { "depth": 4, "templates": [ { "args": { "1": "ky", "2": "сарымсак" }, "expansion": "Kyrgyz: сарымсак (sarımsak)", "name": "desc" } ], "text": "Kyrgyz: сарымсак (sarımsak)" }, { "depth": 4, "templates": [ { "args": { "1": "alt", "2": "сарымсак" }, "expansion": "Southern Altai: сарымсак (sarïmsak)", "name": "desc" } ], "text": "Southern Altai: сарымсак (sarïmsak) (dialectal)" }, { "depth": 1, "templates": [], "text": "Karluk:" }, { "depth": 2, "templates": [ { "args": { "1": "chg", "2": "ساریمساق", "tr": "sarımsaq" }, "expansion": "Chagatai: ساریمساق (sarımsaq)", "name": "desc" } ], "text": "Chagatai: ساریمساق (sarımsaq)" }, { "depth": 3, "templates": [ { "args": { "1": "uz", "2": "sarimsoq" }, "expansion": "Uzbek: sarimsoq", "name": "desc" } ], "text": "Uzbek: sarimsoq" }, { "depth": 3, "templates": [ { "args": { "1": "ug", "2": "سامساق" }, "expansion": "Uyghur: سامساق (samsaq)", "name": "desc" } ], "text": "Uyghur: سامساق (samsaq)" }, { "depth": 1, "templates": [ { "args": { "1": "xgn-pro", "2": "*sarïmsag", "bor": "1" }, "expansion": "→ Proto-Mongolic: *sarïmsag", "name": "desc" } ], "text": "→ Proto-Mongolic: *sarïmsag" }, { "depth": 2, "templates": [ { "args": { "1": "sce", "2": "samusa" }, "expansion": "Dongxiang: samusa", "name": "desc" } ], "text": "Dongxiang: samusa" }, { "depth": 2, "templates": [ { "args": { "1": "mn", "2": "сармис", "alts": "1" }, "expansion": "Mongolian: сармис (sarmis), саримсаг (sarimsag), саримс (sarims)", "name": "desc" } ], "text": "Mongolian: сармис (sarmis), саримсаг (sarimsag), саримс (sarims)" } ], "etymology_templates": [ { "args": { "1": "trk-pro", "2": "ira" }, "expansion": "Iranian", "name": "bor" }, { "args": { "1": "cv", "2": "-" }, "expansion": "Chuvash", "name": "cog" }, { "args": { "1": "trk-sib", "2": "-" }, "expansion": "Siberian Turkic", "name": "cog" }, { "args": { "1": "fa", "2": "سیرمو", "tr": "sirmu" }, "expansion": "Persian سیرمو (sirmu)", "name": "cog" }, { "args": { "1": "kho", "tr": "sarme" }, "expansion": "Khotanese [script needed] (sarme)", "name": "cog" }, { "args": { "1": "sla-pro", "2": "*čermъša", "t": "ramsons" }, "expansion": "Proto-Slavic *čermъša (“ramsons”)", "name": "cog" }, { "args": { "1": "lt", "2": "kermùšė", "t": "ramsons" }, "expansion": "Lithuanian kermùšė (“ramsons”)", "name": "cog" }, { "args": { "1": "grc", "2": "κρόμμυον" }, "expansion": "Ancient Greek κρόμμυον (krómmuon)", "name": "cog" }, { "args": { "1": "gmw-pro", "2": "*hramusō", "t": "ramson" }, "expansion": "Proto-West Germanic *hramusō (“ramson”)", "name": "cog" }, { "args": { "1": "sga", "2": "crem", "t": "ramson" }, "expansion": "Old Irish crem (“ramson”)", "name": "cog" }, { "args": { "1": "ga", "2": "creamh" }, "expansion": "Irish creamh", "name": "cog" }, { "args": { "1": "xco", "tr": "-cyk" }, "expansion": "Khwarezmian [script needed] (-cyk)", "name": "cog" }, { "args": { "1": "sog", "tr": "-cyq" }, "expansion": "Sogdian [script needed] (-cyq)", "name": "cog" }, { "args": { "1": "hu", "2": "sárma" }, "expansion": "Hungarian sárma", "name": "cog" }, { "args": { "1": "hu", "2": "xln", "3": "-", "nocat": "1" }, "expansion": "Alanic", "name": "der" }, { "args": { "1": "trk", "2": "-" }, "expansion": "Turkic", "name": "cog" } ], "etymology_text": "Initially held to be derived from sarım (\"winding\"), which was later found phonetically and morphologically problematic. Another theory conceptualizes it after its yellowish-white root as a sarımsı (“yellowish, whitish” < sarı \"yellow\", from Proto-Turkic *sāryg (“yellow”), derived from the root *siar(ï)- originally preserving the primary meaning ‘white’ in Chuvash as шурӑ {šură}.\nAlternatively borrowed from Iranian, with the argument of the absence in Chuvash and Siberian Turkic. Found in Persian سیرمو (sirmu), سیر (sir, “garlic”), Khotanese [script needed] (sarme), [script needed] (sarmā, an eaten bulb of uncertain identification), doubtfully further connected to Proto-Slavic *čermъša (“ramsons”), Lithuanian kermùšė (“ramsons”), Ancient Greek κρόμμυον (krómmuon), Proto-West Germanic *hramusō (“ramson”), Old Irish crem (“ramson”) (Irish creamh). The suffix -sak (compare: -cik) of the Turkic word is depicted by Khwarezmian [script needed] (-cyk), Sogdian [script needed] (-cyq) that form the nisba adjective and noun. This suffix is recently held to be derived from the native form s(ı) + Old Turkic participle suffix ak or ç + diminutive suffix ak.\nHungarian sárma, meaning Ornithogalum species, which is of the same botanical order as garlic, is either an Alanic or a Turkic borrowing, observing also that in Turkic words which otherwise denote the garlic are used for Ornithogalum.", "forms": [ { "form": "no-table-tags", "source": "declension", "tags": [ "table-tags" ] }, { "form": "trk-pro-decl-noun", "source": "declension", "tags": [ "inflection-template" ] }, { "form": "sarïmsak", "source": "declension", "tags": [ "nominative", "singular" ] }, { "form": "sarïmsakïg", "source": "declension", "tags": [ "accusative", "singular" ] }, { "form": "sarïmsaknï", "source": "declension", "tags": [ "accusative", "singular" ] }, { "form": "sarïmsaknïŋ", "source": "declension", "tags": [ "genitive", "singular" ] }, { "form": "sarïmsakka", "source": "declension", "tags": [ "dative", "singular" ] }, { "form": "sarïmsakda", "source": "declension", "tags": [ "locative", "singular" ] }, { "form": "sarïmsakdan", "source": "declension", "tags": [ "ablative", "singular" ] }, { "form": "sarïmsakgaru", "source": "declension", "tags": [ "allative", "singular" ] }, { "form": "sarïmsakïn", "source": "declension", "tags": [ "instrumental", "singular" ] }, { "form": "sarïmsakča", "source": "declension", "tags": [ "equative", "singular" ] }, { "form": "sarïmsaklayu", "source": "declension", "tags": [ "error-unrecognized-form", "singular" ] }, { "form": "sarïmsaklïgu", "source": "declension", "tags": [ "comitative", "singular" ] } ], "head_templates": [ { "args": { "1": "trk-pro", "2": "noun" }, "expansion": "*sarïmsak", "name": "head" } ], "inflection_templates": [ { "args": { "1": "a" }, "name": "trk-pro-decl-noun" } ], "lang": "Proto-Turkic", "lang_code": "trk-pro", "original_title": "Reconstruction:Proto-Turkic/sarïmsak", "pos": "noun", "senses": [ { "categories": [ "Pages with 1 entry", "Pages with entries", "Proto-Turkic entries with incorrect language header", "Proto-Turkic lemmas", "Proto-Turkic nouns", "Proto-Turkic terms borrowed from Iranian languages", "Proto-Turkic terms derived from Iranian languages", "Requests for native script for Khotanese terms", "Requests for native script for Khwarezmian terms", "Requests for native script for Sogdian terms", "trk-pro:Asparagales order plants", "trk-pro:Vegetables" ], "glosses": [ "garlic" ], "links": [ [ "garlic", "garlic" ] ], "tags": [ "reconstruction" ] } ], "word": "sarïmsak" }
Download raw JSONL data for sarïmsak meaning in Proto-Turkic (9.7kB)
This page is a part of the kaikki.org machine-readable Proto-Turkic dictionary. This dictionary is based on structured data extracted on 2024-11-06 from the enwiktionary dump dated 2024-10-02 using wiktextract (fbeafe8 and 7f03c9b). The data shown on this site has been post-processed and various details (e.g., extra categories) removed, some information disambiguated, and additional data merged from other sources. See the raw data download page for the unprocessed wiktextract data.
If you use this data in academic research, please cite Tatu Ylonen: Wiktextract: Wiktionary as Machine-Readable Structured Data, Proceedings of the 13th Conference on Language Resources and Evaluation (LREC), pp. 1317-1325, Marseille, 20-25 June 2022. Linking to the relevant page(s) under https://kaikki.org would also be greatly appreciated.