See Colombo in All languages combined, or Wiktionary
{ "etymology_number": 1, "etymology_templates": [ { "args": { "1": "en", "2": "pt", "3": "Colombo" }, "expansion": "Portuguese Colombo", "name": "bor" }, { "args": { "1": "en", "2": "si", "3": "කොලොන් තොට", "lit": "port on the river Kelani" }, "expansion": "Sinhalese කොලොන් තොට (kolon toṭa, literally “port on the river Kelani”)", "name": "der" }, { "args": { "1": "en", "2": "ved", "3": "-" }, "expansion": "Veddah", "name": "der" }, { "args": { "1": "w:Colombo#Etymology" }, "expansion": "w:Colombo § Etymology", "name": "section link" } ], "etymology_text": "From Portuguese Colombo, modification (under the influence of the Italian surname, see below) of Sinhalese කොලොන් තොට (kolon toṭa, literally “port on the river Kelani”). Other theories derive the name from Veddah; see w:Colombo § Etymology for more.", "head_templates": [ { "args": {}, "expansion": "Colombo", "name": "en-proper noun" } ], "lang": "English", "lang_code": "en", "pos": "name", "senses": [ { "categories": [ { "kind": "place", "langcode": "en", "name": "Cities in Sri Lanka", "orig": "en:Cities in Sri Lanka", "parents": [ "Cities", "Places", "Polities", "Names", "All topics", "Proper nouns", "Terms by semantic function", "Fundamental", "Nouns", "Lemmas" ], "source": "w" }, { "kind": "place", "langcode": "en", "name": "National capitals", "orig": "en:National capitals", "parents": [ "Capital cities", "Cities", "Polities", "Places", "Names", "All topics", "Proper nouns", "Terms by semantic function", "Fundamental", "Nouns", "Lemmas" ], "source": "w" }, { "kind": "place", "langcode": "en", "name": "Places in Sri Lanka", "orig": "en:Places in Sri Lanka", "parents": [ "Places", "Names", "All topics", "Proper nouns", "Terms by semantic function", "Fundamental", "Nouns", "Lemmas" ], "source": "w" }, { "_dis": "80 20", "kind": "other", "name": "English entries with incorrect language header", "parents": [ "Entries with incorrect language header", "Entry maintenance" ], "source": "w+disamb" }, { "kind": "other", "name": "Entries with translation boxes", "parents": [], "source": "w+disamb" }, { "_dis": "24 13 9 20 20 9 4", "kind": "other", "name": "Pages with 5 entries", "parents": [], "source": "w+disamb" }, { "_dis": "24 9 6 26 26 6 3", "kind": "other", "name": "Pages with entries", "parents": [], "source": "w+disamb" }, { "kind": "other", "name": "Terms with Albanian translations", "parents": [], "source": "w+disamb" }, { "kind": "other", "name": "Terms with Amharic translations", "parents": [], "source": "w+disamb" }, { "kind": "other", "name": "Terms with Arabic translations", "parents": [], "source": "w+disamb" }, { "kind": "other", "name": "Terms with Armenian translations", "parents": [], "source": "w+disamb" }, { "kind": "other", "name": "Terms with Assamese translations", "parents": [], "source": "w+disamb" }, { "kind": "other", "name": "Terms with Azerbaijani translations", "parents": [], "source": "w+disamb" }, { "kind": "other", "name": "Terms with Belarusian translations", "parents": [], "source": "w+disamb" }, { "kind": "other", "name": "Terms with Bengali translations", "parents": [], "source": "w+disamb" }, { "kind": "other", "name": "Terms with Bulgarian translations", "parents": [], "source": "w+disamb" }, { "kind": "other", "name": "Terms with Burmese translations", "parents": [], "source": "w+disamb" }, { "kind": "other", "name": "Terms with Cantonese translations", "parents": [], "source": "w+disamb" }, { "kind": "other", "name": "Terms with Czech translations", "parents": [], "source": "w+disamb" }, { "kind": "other", "name": "Terms with Danish translations", "parents": [], "source": "w+disamb" }, { "kind": "other", "name": "Terms with Dhivehi translations", "parents": [], "source": "w+disamb" }, { "kind": "other", "name": "Terms with Dutch translations", "parents": [], "source": "w+disamb" }, { "kind": "other", "name": "Terms with Esperanto translations", "parents": [], "source": "w+disamb" }, { "kind": "other", "name": "Terms with Estonian translations", "parents": [], "source": "w+disamb" }, { "kind": "other", "name": "Terms with Finnish translations", "parents": [], "source": "w+disamb" }, { "kind": "other", "name": "Terms with French translations", "parents": [], "source": "w+disamb" }, { "kind": "other", "name": "Terms with Georgian translations", "parents": [], "source": "w+disamb" }, { "kind": "other", "name": "Terms with German translations", "parents": [], "source": "w+disamb" }, { "kind": "other", "name": "Terms with Greek translations", "parents": [], "source": "w+disamb" }, { "kind": "other", "name": "Terms with Gujarati translations", "parents": [], "source": "w+disamb" }, { "kind": "other", "name": "Terms with Hebrew translations", "parents": [], "source": "w+disamb" }, { "kind": "other", "name": "Terms with Hindi translations", "parents": [], "source": "w+disamb" }, { "kind": "other", "name": "Terms with Hungarian translations", "parents": [], "source": "w+disamb" }, { "kind": "other", "name": "Terms with Icelandic translations", "parents": [], "source": "w+disamb" }, { "kind": "other", "name": "Terms with Indonesian translations", "parents": [], "source": "w+disamb" }, { "kind": "other", "name": "Terms with Irish translations", "parents": [], "source": "w+disamb" }, { "kind": "other", "name": "Terms with Italian translations", "parents": [], "source": "w+disamb" }, { "kind": "other", "name": "Terms with Japanese translations", "parents": [], "source": "w+disamb" }, { "kind": "other", "name": "Terms with Kannada translations", "parents": [], "source": "w+disamb" }, { "kind": "other", "name": "Terms with Kazakh translations", "parents": [], "source": "w+disamb" }, { "kind": "other", "name": "Terms with Khmer translations", "parents": [], "source": "w+disamb" }, { "kind": "other", "name": "Terms with Korean translations", "parents": [], "source": "w+disamb" }, { "kind": "other", "name": "Terms with Kyrgyz translations", "parents": [], "source": "w+disamb" }, { "kind": "other", "name": "Terms with Latvian translations", "parents": [], "source": "w+disamb" }, { "kind": "other", "name": "Terms with Lithuanian translations", "parents": [], "source": "w+disamb" }, { "kind": "other", "name": "Terms with Macedonian translations", "parents": [], "source": "w+disamb" }, { "kind": "other", "name": "Terms with Malay translations", "parents": [], "source": "w+disamb" }, { "kind": "other", "name": "Terms with Malayalam translations", "parents": [], "source": "w+disamb" }, { "kind": "other", "name": "Terms with Mandarin translations", "parents": [], "source": "w+disamb" }, { "kind": "other", "name": "Terms with Marathi translations", "parents": [], "source": "w+disamb" }, { "kind": "other", "name": "Terms with Mongolian translations", "parents": [], "source": "w+disamb" }, { "kind": "other", "name": "Terms with Nepali translations", "parents": [], "source": "w+disamb" }, { "kind": "other", "name": "Terms with Northern Kurdish translations", "parents": [], "source": "w+disamb" }, { "kind": "other", "name": "Terms with Norwegian Bokmål translations", "parents": [], "source": "w+disamb" }, { "kind": "other", "name": "Terms with Norwegian Nynorsk translations", "parents": [], "source": "w+disamb" }, { "kind": "other", "name": "Terms with Odia translations", "parents": [], "source": "w+disamb" }, { "kind": "other", "name": "Terms with Pashto translations", "parents": [], "source": "w+disamb" }, { "kind": "other", "name": "Terms with Persian translations", "parents": [], "source": "w+disamb" }, { "kind": "other", "name": "Terms with Polish translations", "parents": [], "source": "w+disamb" }, { "kind": "other", "name": "Terms with Portuguese translations", "parents": [], "source": "w+disamb" }, { "kind": "other", "name": "Terms with Punjabi translations", "parents": [], "source": "w+disamb" }, { "kind": "other", "name": "Terms with Romanian translations", "parents": [], "source": "w+disamb" }, { "kind": "other", "name": "Terms with Russian translations", "parents": [], "source": "w+disamb" }, { "kind": "other", "name": "Terms with Serbo-Croatian translations", "parents": [], "source": "w+disamb" }, { "kind": "other", "name": "Terms with Sinhalese translations", "parents": [], "source": "w+disamb" }, { "kind": "other", "name": "Terms with Slovak translations", "parents": [], "source": "w+disamb" }, { "kind": "other", "name": "Terms with Slovene translations", "parents": [], "source": "w+disamb" }, { "kind": "other", "name": "Terms with Spanish translations", "parents": [], "source": "w+disamb" }, { "kind": "other", "name": "Terms with Swedish translations", "parents": [], "source": "w+disamb" }, { "kind": "other", "name": "Terms with Tagalog translations", "parents": [], "source": "w+disamb" }, { "kind": "other", "name": "Terms with Tajik translations", "parents": [], "source": "w+disamb" }, { "kind": "other", "name": "Terms with Tamil translations", "parents": [], "source": "w+disamb" }, { "kind": "other", "name": "Terms with Tatar translations", "parents": [], "source": "w+disamb" }, { "kind": "other", "name": "Terms with Telugu translations", "parents": [], "source": "w+disamb" }, { "kind": "other", "name": "Terms with Thai translations", "parents": [], "source": "w+disamb" }, { "kind": "other", "name": "Terms with Tibetan translations", "parents": [], "source": "w+disamb" }, { "kind": "other", "name": "Terms with Turkmen translations", "parents": [], "source": "w+disamb" }, { "kind": "other", "name": "Terms with Ukrainian translations", "parents": [], "source": "w+disamb" }, { "kind": "other", "name": "Terms with Urdu translations", "parents": [], "source": "w+disamb" }, { "kind": "other", "name": "Terms with Uyghur translations", "parents": [], "source": "w+disamb" }, { "kind": "other", "name": "Terms with Uzbek translations", "parents": [], "source": "w+disamb" }, { "kind": "other", "name": "Terms with Vietnamese translations", "parents": [], "source": "w+disamb" }, { "kind": "other", "name": "Terms with Yiddish translations", "parents": [], "source": "w+disamb" } ], "examples": [ { "ref": "2022, Shehan Karunatilaka, The Seven Moons of Maali Almeida, Sort Of Books, page 266:", "text": "From this height, Colombo does not look like a mess. It sleeps in shadows decorated with trees and lights.", "type": "quote" } ], "glosses": [ "The commercial capital and largest city of Sri Lanka." ], "id": "en-Colombo-en-name-3I69yzuj", "links": [ [ "capital", "capital" ], [ "Sri Lanka", "Sri Lanka#English" ] ], "translations": [ { "code": "sq", "lang": "Albanian", "sense": "capital of Sri Lanka", "word": "Kolombo" }, { "code": "am", "lang": "Amharic", "roman": "kolombo", "sense": "capital of Sri Lanka", "word": "ኮሎምቦ" }, { "code": "ar", "lang": "Arabic", "roman": "kolombō", "sense": "capital of Sri Lanka", "tags": [ "feminine" ], "word": "كُولُومْبُو" }, { "code": "hy", "lang": "Armenian", "roman": "Kolombo", "sense": "capital of Sri Lanka", "word": "Կոլոմբո" }, { "code": "as", "lang": "Assamese", "roman": "kolombü", "sense": "capital of Sri Lanka", "word": "কলম্বো" }, { "code": "az", "lang": "Azerbaijani", "sense": "capital of Sri Lanka", "word": "Kolombo" }, { "code": "be", "lang": "Belarusian", "roman": "Kalómba", "sense": "capital of Sri Lanka", "tags": [ "masculine" ], "word": "Кало́мба" }, { "code": "bn", "lang": "Bengali", "roman": "kolombō", "sense": "capital of Sri Lanka", "word": "কলম্বো" }, { "code": "bg", "lang": "Bulgarian", "roman": "Kolómbo", "sense": "capital of Sri Lanka", "tags": [ "masculine" ], "word": "Коло́мбо" }, { "code": "my", "lang": "Burmese", "roman": "kuilambhui", "sense": "capital of Sri Lanka", "word": "ကိုလံဘို" }, { "code": "yue", "lang": "Chinese Cantonese", "sense": "capital of Sri Lanka", "word": "科倫坡" }, { "code": "yue", "lang": "Chinese Cantonese", "roman": "fo¹ leon⁴ bo¹", "sense": "capital of Sri Lanka", "word": "科伦坡" }, { "code": "cmn", "lang": "Chinese Mandarin", "sense": "capital of Sri Lanka", "word": "科倫坡" }, { "code": "cmn", "lang": "Chinese Mandarin", "roman": "Kēlúnpō", "sense": "capital of Sri Lanka", "word": "科伦坡" }, { "code": "cmn", "lang": "Chinese Mandarin", "sense": "capital of Sri Lanka", "word": "可倫坡" }, { "code": "cmn", "lang": "Chinese Mandarin", "roman": "Kělúnpō", "sense": "capital of Sri Lanka", "word": "可伦坡" }, { "code": "cs", "lang": "Czech", "sense": "capital of Sri Lanka", "tags": [ "neuter" ], "word": "Kolombo" }, { "code": "da", "lang": "Danish", "sense": "capital of Sri Lanka", "tags": [ "neuter" ], "word": "Colombo" }, { "code": "dv", "lang": "Dhivehi", "roman": "koḷuᵐbu", "sense": "capital of Sri Lanka", "word": "ކޮޅުނބު" }, { "code": "nl", "lang": "Dutch", "sense": "capital of Sri Lanka", "tags": [ "neuter" ], "word": "Colombo" }, { "code": "eo", "lang": "Esperanto", "sense": "capital of Sri Lanka", "word": "Kolombo" }, { "code": "et", "lang": "Estonian", "sense": "capital of Sri Lanka", "word": "Colombo" }, { "code": "fi", "lang": "Finnish", "sense": "capital of Sri Lanka", "word": "Colombo" }, { "code": "fr", "lang": "French", "sense": "capital of Sri Lanka", "tags": [ "feminine" ], "word": "Colombo" }, { "code": "ka", "lang": "Georgian", "roman": "ḳolombo", "sense": "capital of Sri Lanka", "word": "კოლომბო" }, { "code": "de", "lang": "German", "sense": "capital of Sri Lanka", "tags": [ "neuter" ], "word": "Colombo" }, { "code": "el", "lang": "Greek", "roman": "Kolómpo", "sense": "capital of Sri Lanka", "tags": [ "neuter" ], "word": "Κολόμπο" }, { "code": "gu", "lang": "Gujarati", "roman": "kolambo", "sense": "capital of Sri Lanka", "word": "કોલંબો" }, { "code": "he", "lang": "Hebrew", "roman": "kolómbo", "sense": "capital of Sri Lanka", "tags": [ "feminine" ], "word": "קוֹלוֹמְבּוֹ" }, { "code": "hi", "lang": "Hindi", "roman": "kolambo", "sense": "capital of Sri Lanka", "tags": [ "masculine" ], "word": "कोलंबो" }, { "code": "hu", "lang": "Hungarian", "sense": "capital of Sri Lanka", "word": "Colombo" }, { "code": "is", "lang": "Icelandic", "sense": "capital of Sri Lanka", "word": "Kólombó" }, { "code": "id", "lang": "Indonesian", "sense": "capital of Sri Lanka", "word": "Kolombo" }, { "code": "ga", "lang": "Irish", "sense": "capital of Sri Lanka", "word": "Colombo" }, { "code": "it", "lang": "Italian", "sense": "capital of Sri Lanka", "tags": [ "feminine" ], "word": "Colombo" }, { "code": "ja", "lang": "Japanese", "roman": "Koronbo", "sense": "capital of Sri Lanka", "word": "コロンボ" }, { "code": "kn", "lang": "Kannada", "roman": "kolambo", "sense": "capital of Sri Lanka", "word": "ಕೊಲಂಬೊ" }, { "code": "kk", "lang": "Kazakh", "roman": "Kolombo", "sense": "capital of Sri Lanka", "word": "Коломбо" }, { "code": "km", "lang": "Khmer", "roman": "koulombou", "sense": "capital of Sri Lanka", "word": "កូឡុំបូ" }, { "code": "ko", "lang": "Korean", "roman": "Kollombo", "sense": "capital of Sri Lanka", "word": "콜롬보" }, { "code": "kmr", "lang": "Northern Kurdish", "sense": "capital of Sri Lanka", "word": "Colombo" }, { "code": "ky", "lang": "Kyrgyz", "roman": "Kolombo", "sense": "capital of Sri Lanka", "word": "Коломбо" }, { "code": "lv", "lang": "Latvian", "sense": "capital of Sri Lanka", "word": "Kolombo" }, { "code": "lt", "lang": "Lithuanian", "sense": "capital of Sri Lanka", "tags": [ "masculine" ], "word": "Kolombas" }, { "code": "mk", "lang": "Macedonian", "roman": "Kolombo", "sense": "capital of Sri Lanka", "word": "Коломбо" }, { "code": "ms", "lang": "Malay", "sense": "capital of Sri Lanka", "word": "Colombo" }, { "code": "ml", "lang": "Malayalam", "roman": "koḷambō", "sense": "capital of Sri Lanka", "word": "കൊളംബോ" }, { "code": "mr", "lang": "Marathi", "roman": "kolambo", "sense": "capital of Sri Lanka", "word": "कोलंबो" }, { "code": "mn", "lang": "Mongolian", "roman": "Kolombo", "sense": "capital of Sri Lanka", "tags": [ "Cyrillic" ], "word": "Коломбо" }, { "code": "ne", "lang": "Nepali", "roman": "kolambo", "sense": "capital of Sri Lanka", "word": "कोलम्बो" }, { "code": "nb", "lang": "Norwegian Bokmål", "sense": "capital of Sri Lanka", "word": "Colombo" }, { "code": "nn", "lang": "Norwegian Nynorsk", "sense": "capital of Sri Lanka", "word": "Colombo" }, { "code": "or", "lang": "Odia", "roman": "kalombo", "sense": "capital of Sri Lanka", "word": "କଲୋମ୍ବୋ" }, { "code": "ps", "lang": "Pashto", "roman": "kolāmbó", "sense": "capital of Sri Lanka", "tags": [ "feminine" ], "word": "کولمبو" }, { "code": "fa", "lang": "Persian", "roman": "kolombo", "sense": "capital of Sri Lanka", "word": "کلمبو" }, { "code": "pl", "lang": "Polish", "sense": "capital of Sri Lanka", "tags": [ "neuter" ], "word": "Kolombo" }, { "code": "pt", "lang": "Portuguese", "sense": "capital of Sri Lanka", "tags": [ "feminine" ], "word": "Colombo" }, { "code": "pa", "lang": "Punjabi", "roman": "kolambo", "sense": "capital of Sri Lanka", "word": "ਕੋਲੰਬੋ" }, { "code": "ro", "lang": "Romanian", "sense": "capital of Sri Lanka", "word": "Colombo" }, { "code": "ru", "lang": "Russian", "roman": "Kolómbo", "sense": "capital of Sri Lanka", "tags": [ "masculine" ], "word": "Коло́мбо" }, { "code": "sh", "lang": "Serbo-Croatian", "sense": "capital of Sri Lanka", "tags": [ "Cyrillic", "masculine" ], "word": "Коломбо" }, { "code": "sh", "lang": "Serbo-Croatian", "sense": "capital of Sri Lanka", "tags": [ "Roman", "masculine" ], "word": "Kolombo" }, { "code": "si", "lang": "Sinhalese", "roman": "koḷaᵐba", "sense": "capital of Sri Lanka", "word": "කොළඹ" }, { "code": "sk", "lang": "Slovak", "sense": "capital of Sri Lanka", "tags": [ "neuter" ], "word": "Kolombo" }, { "code": "sl", "lang": "Slovene", "sense": "capital of Sri Lanka", "tags": [ "masculine" ], "word": "Kolombo" }, { "code": "es", "lang": "Spanish", "sense": "capital of Sri Lanka", "tags": [ "masculine" ], "word": "Colombo" }, { "code": "sv", "lang": "Swedish", "sense": "capital of Sri Lanka", "tags": [ "neuter" ], "word": "Colombo" }, { "code": "tl", "lang": "Tagalog", "sense": "capital of Sri Lanka", "word": "Colombo" }, { "code": "tg", "lang": "Tajik", "roman": "Kolombo", "sense": "capital of Sri Lanka", "word": "Коломбо" }, { "code": "ta", "lang": "Tamil", "roman": "koḻumpu", "sense": "capital of Sri Lanka", "word": "கொழும்பு" }, { "code": "tt", "lang": "Tatar", "roman": "Qolombo", "sense": "capital of Sri Lanka", "word": "Коломбо" }, { "code": "te", "lang": "Telugu", "roman": "kolambō", "sense": "capital of Sri Lanka", "word": "కొలంబో" }, { "code": "th", "lang": "Thai", "roman": "koo-lam-boo", "sense": "capital of Sri Lanka", "word": "โคลัมโบ" }, { "code": "bo", "lang": "Tibetan", "roman": "kho lum po", "sense": "capital of Sri Lanka", "word": "ཁོ་ལུམ་པོ" }, { "code": "tk", "lang": "Turkmen", "sense": "capital of Sri Lanka", "word": "Kolombo" }, { "code": "uk", "lang": "Ukrainian", "roman": "Kolómbo", "sense": "capital of Sri Lanka", "tags": [ "masculine" ], "word": "Коло́мбо" }, { "code": "ur", "lang": "Urdu", "roman": "kolambo", "sense": "capital of Sri Lanka", "tags": [ "masculine" ], "word": "کولمبو" }, { "code": "ug", "lang": "Uyghur", "roman": "kolombo", "sense": "capital of Sri Lanka", "word": "كولومبو" }, { "code": "uz", "lang": "Uzbek", "sense": "capital of Sri Lanka", "word": "Kolombo" }, { "code": "vi", "lang": "Vietnamese", "sense": "capital of Sri Lanka", "word": "Cô-lôm-bô" }, { "code": "yi", "lang": "Yiddish", "roman": "kolombo", "sense": "capital of Sri Lanka", "tags": [ "neuter" ], "word": "קאָלאָמבאָ" } ] } ], "sounds": [ { "ipa": "/kəˈlɒm.bəʊ/", "tags": [ "UK" ] }, { "ipa": "/kəˈlʌm.bəʊ/", "tags": [ "UK" ] }, { "ipa": "/ˈkɒl.əm.bəʊ/", "tags": [ "UK", "also" ], "topics": [ "city", "cities", "region", "location" ] }, { "audio": "LL-Q1860 (eng)-Vealhurl-Colombo.wav", "mp3_url": "https://upload.wikimedia.org/wikipedia/commons/transcoded/4/47/LL-Q1860_%28eng%29-Vealhurl-Colombo.wav/LL-Q1860_%28eng%29-Vealhurl-Colombo.wav.mp3", "ogg_url": "https://upload.wikimedia.org/wikipedia/commons/transcoded/4/47/LL-Q1860_%28eng%29-Vealhurl-Colombo.wav/LL-Q1860_%28eng%29-Vealhurl-Colombo.wav.ogg" }, { "audio": "LL-Q1860 (eng)-Vealhurl-Colombo2.wav", "mp3_url": "https://upload.wikimedia.org/wikipedia/commons/transcoded/5/5b/LL-Q1860_%28eng%29-Vealhurl-Colombo2.wav/LL-Q1860_%28eng%29-Vealhurl-Colombo2.wav.mp3", "ogg_url": "https://upload.wikimedia.org/wikipedia/commons/transcoded/5/5b/LL-Q1860_%28eng%29-Vealhurl-Colombo2.wav/LL-Q1860_%28eng%29-Vealhurl-Colombo2.wav.ogg" }, { "audio": "LL-Q1860 (eng)-Vealhurl-Colombo3.wav", "mp3_url": "https://upload.wikimedia.org/wikipedia/commons/transcoded/4/4b/LL-Q1860_%28eng%29-Vealhurl-Colombo3.wav/LL-Q1860_%28eng%29-Vealhurl-Colombo3.wav.mp3", "ogg_url": "https://upload.wikimedia.org/wikipedia/commons/transcoded/4/4b/LL-Q1860_%28eng%29-Vealhurl-Colombo3.wav/LL-Q1860_%28eng%29-Vealhurl-Colombo3.wav.ogg" }, { "rhymes": "-ʌmbəʊ" } ], "wikipedia": [ "Colombo" ], "word": "Colombo" } { "etymology_number": 2, "etymology_templates": [ { "args": { "1": "en", "2": "it", "3": "Colombo" }, "expansion": "Italian Colombo", "name": "bor" } ], "etymology_text": "From Italian Colombo, from colombo (“pigeon, dove”).", "head_templates": [ { "args": {}, "expansion": "Colombo", "name": "en-proper noun" } ], "lang": "English", "lang_code": "en", "pos": "name", "senses": [ { "categories": [ { "kind": "other", "name": "English surnames", "parents": [], "source": "w" }, { "_dis": "24 13 9 20 20 9 4", "kind": "other", "name": "Pages with 5 entries", "parents": [], "source": "w+disamb" } ], "glosses": [ "A surname from Italian." ], "id": "en-Colombo-en-name-rsy3jwmJ", "links": [ [ "surname", "surname" ] ] } ], "sounds": [ { "ipa": "/kəˈlɒm.bəʊ/", "tags": [ "UK" ] }, { "ipa": "/kəˈlʌm.bəʊ/", "tags": [ "UK" ] }, { "ipa": "/ˈkɒl.əm.bəʊ/", "tags": [ "UK", "also" ], "topics": [ "city", "cities", "region", "location" ] }, { "audio": "LL-Q1860 (eng)-Vealhurl-Colombo.wav", "mp3_url": "https://upload.wikimedia.org/wikipedia/commons/transcoded/4/47/LL-Q1860_%28eng%29-Vealhurl-Colombo.wav/LL-Q1860_%28eng%29-Vealhurl-Colombo.wav.mp3", "ogg_url": "https://upload.wikimedia.org/wikipedia/commons/transcoded/4/47/LL-Q1860_%28eng%29-Vealhurl-Colombo.wav/LL-Q1860_%28eng%29-Vealhurl-Colombo.wav.ogg" }, { "audio": "LL-Q1860 (eng)-Vealhurl-Colombo2.wav", "mp3_url": "https://upload.wikimedia.org/wikipedia/commons/transcoded/5/5b/LL-Q1860_%28eng%29-Vealhurl-Colombo2.wav/LL-Q1860_%28eng%29-Vealhurl-Colombo2.wav.mp3", "ogg_url": "https://upload.wikimedia.org/wikipedia/commons/transcoded/5/5b/LL-Q1860_%28eng%29-Vealhurl-Colombo2.wav/LL-Q1860_%28eng%29-Vealhurl-Colombo2.wav.ogg" }, { "audio": "LL-Q1860 (eng)-Vealhurl-Colombo3.wav", "mp3_url": "https://upload.wikimedia.org/wikipedia/commons/transcoded/4/4b/LL-Q1860_%28eng%29-Vealhurl-Colombo3.wav/LL-Q1860_%28eng%29-Vealhurl-Colombo3.wav.mp3", "ogg_url": "https://upload.wikimedia.org/wikipedia/commons/transcoded/4/4b/LL-Q1860_%28eng%29-Vealhurl-Colombo3.wav/LL-Q1860_%28eng%29-Vealhurl-Colombo3.wav.ogg" }, { "rhymes": "-ʌmbəʊ" } ], "wikipedia": [ "Colombo" ], "word": "Colombo" }
{ "categories": [ "English entries with incorrect language header", "English lemmas", "English proper nouns", "English terms borrowed from Italian", "English terms borrowed from Portuguese", "English terms derived from Italian", "English terms derived from Portuguese", "English terms derived from Sinhalese", "English terms derived from Veddah", "English uncountable nouns", "Entries with translation boxes", "Pages with 5 entries", "Pages with entries", "Rhymes:English/ʌmbəʊ", "Rhymes:English/ʌmbəʊ/3 syllables", "Terms with Albanian translations", "Terms with Amharic translations", "Terms with Arabic translations", "Terms with Armenian translations", "Terms with Assamese translations", "Terms with Azerbaijani translations", "Terms with Belarusian translations", "Terms with Bengali translations", "Terms with Bulgarian translations", "Terms with Burmese translations", "Terms with Cantonese translations", "Terms with Czech translations", "Terms with Danish translations", "Terms with Dhivehi translations", "Terms with Dutch translations", "Terms with Esperanto translations", "Terms with Estonian translations", "Terms with Finnish translations", "Terms with French translations", "Terms with Georgian translations", "Terms with German translations", "Terms with Greek translations", "Terms with Gujarati translations", "Terms with Hebrew translations", "Terms with Hindi translations", "Terms with Hungarian translations", "Terms with Icelandic translations", "Terms with Indonesian translations", "Terms with Irish translations", "Terms with Italian translations", "Terms with Japanese translations", "Terms with Kannada translations", "Terms with Kazakh translations", "Terms with Khmer translations", "Terms with Korean translations", "Terms with Kyrgyz translations", "Terms with Latvian translations", "Terms with Lithuanian translations", "Terms with Macedonian translations", "Terms with Malay translations", "Terms with Malayalam translations", "Terms with Mandarin translations", "Terms with Marathi translations", "Terms with Mongolian translations", "Terms with Nepali translations", "Terms with Northern Kurdish translations", "Terms with Norwegian Bokmål translations", "Terms with Norwegian Nynorsk translations", "Terms with Odia translations", "Terms with Pashto translations", "Terms with Persian translations", "Terms with Polish translations", "Terms with Portuguese translations", "Terms with Punjabi translations", "Terms with Romanian translations", "Terms with Russian translations", "Terms with Serbo-Croatian translations", "Terms with Sinhalese translations", "Terms with Slovak translations", "Terms with Slovene translations", "Terms with Spanish translations", "Terms with Swedish translations", "Terms with Tagalog translations", "Terms with Tajik translations", "Terms with Tamil translations", "Terms with Tatar translations", "Terms with Telugu translations", "Terms with Thai translations", "Terms with Tibetan translations", "Terms with Turkmen translations", "Terms with Ukrainian translations", "Terms with Urdu translations", "Terms with Uyghur translations", "Terms with Uzbek translations", "Terms with Vietnamese translations", "Terms with Yiddish translations" ], "etymology_number": 1, "etymology_templates": [ { "args": { "1": "en", "2": "pt", "3": "Colombo" }, "expansion": "Portuguese Colombo", "name": "bor" }, { "args": { "1": "en", "2": "si", "3": "කොලොන් තොට", "lit": "port on the river Kelani" }, "expansion": "Sinhalese කොලොන් තොට (kolon toṭa, literally “port on the river Kelani”)", "name": "der" }, { "args": { "1": "en", "2": "ved", "3": "-" }, "expansion": "Veddah", "name": "der" }, { "args": { "1": "w:Colombo#Etymology" }, "expansion": "w:Colombo § Etymology", "name": "section link" } ], "etymology_text": "From Portuguese Colombo, modification (under the influence of the Italian surname, see below) of Sinhalese කොලොන් තොට (kolon toṭa, literally “port on the river Kelani”). Other theories derive the name from Veddah; see w:Colombo § Etymology for more.", "head_templates": [ { "args": {}, "expansion": "Colombo", "name": "en-proper noun" } ], "lang": "English", "lang_code": "en", "pos": "name", "senses": [ { "categories": [ "English terms with quotations", "en:Cities in Sri Lanka", "en:National capitals", "en:Places in Sri Lanka" ], "examples": [ { "ref": "2022, Shehan Karunatilaka, The Seven Moons of Maali Almeida, Sort Of Books, page 266:", "text": "From this height, Colombo does not look like a mess. It sleeps in shadows decorated with trees and lights.", "type": "quote" } ], "glosses": [ "The commercial capital and largest city of Sri Lanka." ], "links": [ [ "capital", "capital" ], [ "Sri Lanka", "Sri Lanka#English" ] ] } ], "sounds": [ { "ipa": "/kəˈlɒm.bəʊ/", "tags": [ "UK" ] }, { "ipa": "/kəˈlʌm.bəʊ/", "tags": [ "UK" ] }, { "ipa": "/ˈkɒl.əm.bəʊ/", "tags": [ "UK", "also" ], "topics": [ "city", "cities", "region", "location" ] }, { "audio": "LL-Q1860 (eng)-Vealhurl-Colombo.wav", "mp3_url": "https://upload.wikimedia.org/wikipedia/commons/transcoded/4/47/LL-Q1860_%28eng%29-Vealhurl-Colombo.wav/LL-Q1860_%28eng%29-Vealhurl-Colombo.wav.mp3", "ogg_url": "https://upload.wikimedia.org/wikipedia/commons/transcoded/4/47/LL-Q1860_%28eng%29-Vealhurl-Colombo.wav/LL-Q1860_%28eng%29-Vealhurl-Colombo.wav.ogg" }, { "audio": "LL-Q1860 (eng)-Vealhurl-Colombo2.wav", "mp3_url": "https://upload.wikimedia.org/wikipedia/commons/transcoded/5/5b/LL-Q1860_%28eng%29-Vealhurl-Colombo2.wav/LL-Q1860_%28eng%29-Vealhurl-Colombo2.wav.mp3", "ogg_url": "https://upload.wikimedia.org/wikipedia/commons/transcoded/5/5b/LL-Q1860_%28eng%29-Vealhurl-Colombo2.wav/LL-Q1860_%28eng%29-Vealhurl-Colombo2.wav.ogg" }, { "audio": "LL-Q1860 (eng)-Vealhurl-Colombo3.wav", "mp3_url": "https://upload.wikimedia.org/wikipedia/commons/transcoded/4/4b/LL-Q1860_%28eng%29-Vealhurl-Colombo3.wav/LL-Q1860_%28eng%29-Vealhurl-Colombo3.wav.mp3", "ogg_url": "https://upload.wikimedia.org/wikipedia/commons/transcoded/4/4b/LL-Q1860_%28eng%29-Vealhurl-Colombo3.wav/LL-Q1860_%28eng%29-Vealhurl-Colombo3.wav.ogg" }, { "rhymes": "-ʌmbəʊ" } ], "translations": [ { "code": "sq", "lang": "Albanian", "sense": "capital of Sri Lanka", "word": "Kolombo" }, { "code": "am", "lang": "Amharic", "roman": "kolombo", "sense": "capital of Sri Lanka", "word": "ኮሎምቦ" }, { "code": "ar", "lang": "Arabic", "roman": "kolombō", "sense": "capital of Sri Lanka", "tags": [ "feminine" ], "word": "كُولُومْبُو" }, { "code": "hy", "lang": "Armenian", "roman": "Kolombo", "sense": "capital of Sri Lanka", "word": "Կոլոմբո" }, { "code": "as", "lang": "Assamese", "roman": "kolombü", "sense": "capital of Sri Lanka", "word": "কলম্বো" }, { "code": "az", "lang": "Azerbaijani", "sense": "capital of Sri Lanka", "word": "Kolombo" }, { "code": "be", "lang": "Belarusian", "roman": "Kalómba", "sense": "capital of Sri Lanka", "tags": [ "masculine" ], "word": "Кало́мба" }, { "code": "bn", "lang": "Bengali", "roman": "kolombō", "sense": "capital of Sri Lanka", "word": "কলম্বো" }, { "code": "bg", "lang": "Bulgarian", "roman": "Kolómbo", "sense": "capital of Sri Lanka", "tags": [ "masculine" ], "word": "Коло́мбо" }, { "code": "my", "lang": "Burmese", "roman": "kuilambhui", "sense": "capital of Sri Lanka", "word": "ကိုလံဘို" }, { "code": "yue", "lang": "Chinese Cantonese", "sense": "capital of Sri Lanka", "word": "科倫坡" }, { "code": "yue", "lang": "Chinese Cantonese", "roman": "fo¹ leon⁴ bo¹", "sense": "capital of Sri Lanka", "word": "科伦坡" }, { "code": "cmn", "lang": "Chinese Mandarin", "sense": "capital of Sri Lanka", "word": "科倫坡" }, { "code": "cmn", "lang": "Chinese Mandarin", "roman": "Kēlúnpō", "sense": "capital of Sri Lanka", "word": "科伦坡" }, { "code": "cmn", "lang": "Chinese Mandarin", "sense": "capital of Sri Lanka", "word": "可倫坡" }, { "code": "cmn", "lang": "Chinese Mandarin", "roman": "Kělúnpō", "sense": "capital of Sri Lanka", "word": "可伦坡" }, { "code": "cs", "lang": "Czech", "sense": "capital of Sri Lanka", "tags": [ "neuter" ], "word": "Kolombo" }, { "code": "da", "lang": "Danish", "sense": "capital of Sri Lanka", "tags": [ "neuter" ], "word": "Colombo" }, { "code": "dv", "lang": "Dhivehi", "roman": "koḷuᵐbu", "sense": "capital of Sri Lanka", "word": "ކޮޅުނބު" }, { "code": "nl", "lang": "Dutch", "sense": "capital of Sri Lanka", "tags": [ "neuter" ], "word": "Colombo" }, { "code": "eo", "lang": "Esperanto", "sense": "capital of Sri Lanka", "word": "Kolombo" }, { "code": "et", "lang": "Estonian", "sense": "capital of Sri Lanka", "word": "Colombo" }, { "code": "fi", "lang": "Finnish", "sense": "capital of Sri Lanka", "word": "Colombo" }, { "code": "fr", "lang": "French", "sense": "capital of Sri Lanka", "tags": [ "feminine" ], "word": "Colombo" }, { "code": "ka", "lang": "Georgian", "roman": "ḳolombo", "sense": "capital of Sri Lanka", "word": "კოლომბო" }, { "code": "de", "lang": "German", "sense": "capital of Sri Lanka", "tags": [ "neuter" ], "word": "Colombo" }, { "code": "el", "lang": "Greek", "roman": "Kolómpo", "sense": "capital of Sri Lanka", "tags": [ "neuter" ], "word": "Κολόμπο" }, { "code": "gu", "lang": "Gujarati", "roman": "kolambo", "sense": "capital of Sri Lanka", "word": "કોલંબો" }, { "code": "he", "lang": "Hebrew", "roman": "kolómbo", "sense": "capital of Sri Lanka", "tags": [ "feminine" ], "word": "קוֹלוֹמְבּוֹ" }, { "code": "hi", "lang": "Hindi", "roman": "kolambo", "sense": "capital of Sri Lanka", "tags": [ "masculine" ], "word": "कोलंबो" }, { "code": "hu", "lang": "Hungarian", "sense": "capital of Sri Lanka", "word": "Colombo" }, { "code": "is", "lang": "Icelandic", "sense": "capital of Sri Lanka", "word": "Kólombó" }, { "code": "id", "lang": "Indonesian", "sense": "capital of Sri Lanka", "word": "Kolombo" }, { "code": "ga", "lang": "Irish", "sense": "capital of Sri Lanka", "word": "Colombo" }, { "code": "it", "lang": "Italian", "sense": "capital of Sri Lanka", "tags": [ "feminine" ], "word": "Colombo" }, { "code": "ja", "lang": "Japanese", "roman": "Koronbo", "sense": "capital of Sri Lanka", "word": "コロンボ" }, { "code": "kn", "lang": "Kannada", "roman": "kolambo", "sense": "capital of Sri Lanka", "word": "ಕೊಲಂಬೊ" }, { "code": "kk", "lang": "Kazakh", "roman": "Kolombo", "sense": "capital of Sri Lanka", "word": "Коломбо" }, { "code": "km", "lang": "Khmer", "roman": "koulombou", "sense": "capital of Sri Lanka", "word": "កូឡុំបូ" }, { "code": "ko", "lang": "Korean", "roman": "Kollombo", "sense": "capital of Sri Lanka", "word": "콜롬보" }, { "code": "kmr", "lang": "Northern Kurdish", "sense": "capital of Sri Lanka", "word": "Colombo" }, { "code": "ky", "lang": "Kyrgyz", "roman": "Kolombo", "sense": "capital of Sri Lanka", "word": "Коломбо" }, { "code": "lv", "lang": "Latvian", "sense": "capital of Sri Lanka", "word": "Kolombo" }, { "code": "lt", "lang": "Lithuanian", "sense": "capital of Sri Lanka", "tags": [ "masculine" ], "word": "Kolombas" }, { "code": "mk", "lang": "Macedonian", "roman": "Kolombo", "sense": "capital of Sri Lanka", "word": "Коломбо" }, { "code": "ms", "lang": "Malay", "sense": "capital of Sri Lanka", "word": "Colombo" }, { "code": "ml", "lang": "Malayalam", "roman": "koḷambō", "sense": "capital of Sri Lanka", "word": "കൊളംബോ" }, { "code": "mr", "lang": "Marathi", "roman": "kolambo", "sense": "capital of Sri Lanka", "word": "कोलंबो" }, { "code": "mn", "lang": "Mongolian", "roman": "Kolombo", "sense": "capital of Sri Lanka", "tags": [ "Cyrillic" ], "word": "Коломбо" }, { "code": "ne", "lang": "Nepali", "roman": "kolambo", "sense": "capital of Sri Lanka", "word": "कोलम्बो" }, { "code": "nb", "lang": "Norwegian Bokmål", "sense": "capital of Sri Lanka", "word": "Colombo" }, { "code": "nn", "lang": "Norwegian Nynorsk", "sense": "capital of Sri Lanka", "word": "Colombo" }, { "code": "or", "lang": "Odia", "roman": "kalombo", "sense": "capital of Sri Lanka", "word": "କଲୋମ୍ବୋ" }, { "code": "ps", "lang": "Pashto", "roman": "kolāmbó", "sense": "capital of Sri Lanka", "tags": [ "feminine" ], "word": "کولمبو" }, { "code": "fa", "lang": "Persian", "roman": "kolombo", "sense": "capital of Sri Lanka", "word": "کلمبو" }, { "code": "pl", "lang": "Polish", "sense": "capital of Sri Lanka", "tags": [ "neuter" ], "word": "Kolombo" }, { "code": "pt", "lang": "Portuguese", "sense": "capital of Sri Lanka", "tags": [ "feminine" ], "word": "Colombo" }, { "code": "pa", "lang": "Punjabi", "roman": "kolambo", "sense": "capital of Sri Lanka", "word": "ਕੋਲੰਬੋ" }, { "code": "ro", "lang": "Romanian", "sense": "capital of Sri Lanka", "word": "Colombo" }, { "code": "ru", "lang": "Russian", "roman": "Kolómbo", "sense": "capital of Sri Lanka", "tags": [ "masculine" ], "word": "Коло́мбо" }, { "code": "sh", "lang": "Serbo-Croatian", "sense": "capital of Sri Lanka", "tags": [ "Cyrillic", "masculine" ], "word": "Коломбо" }, { "code": "sh", "lang": "Serbo-Croatian", "sense": "capital of Sri Lanka", "tags": [ "Roman", "masculine" ], "word": "Kolombo" }, { "code": "si", "lang": "Sinhalese", "roman": "koḷaᵐba", "sense": "capital of Sri Lanka", "word": "කොළඹ" }, { "code": "sk", "lang": "Slovak", "sense": "capital of Sri Lanka", "tags": [ "neuter" ], "word": "Kolombo" }, { "code": "sl", "lang": "Slovene", "sense": "capital of Sri Lanka", "tags": [ "masculine" ], "word": "Kolombo" }, { "code": "es", "lang": "Spanish", "sense": "capital of Sri Lanka", "tags": [ "masculine" ], "word": "Colombo" }, { "code": "sv", "lang": "Swedish", "sense": "capital of Sri Lanka", "tags": [ "neuter" ], "word": "Colombo" }, { "code": "tl", "lang": "Tagalog", "sense": "capital of Sri Lanka", "word": "Colombo" }, { "code": "tg", "lang": "Tajik", "roman": "Kolombo", "sense": "capital of Sri Lanka", "word": "Коломбо" }, { "code": "ta", "lang": "Tamil", "roman": "koḻumpu", "sense": "capital of Sri Lanka", "word": "கொழும்பு" }, { "code": "tt", "lang": "Tatar", "roman": "Qolombo", "sense": "capital of Sri Lanka", "word": "Коломбо" }, { "code": "te", "lang": "Telugu", "roman": "kolambō", "sense": "capital of Sri Lanka", "word": "కొలంబో" }, { "code": "th", "lang": "Thai", "roman": "koo-lam-boo", "sense": "capital of Sri Lanka", "word": "โคลัมโบ" }, { "code": "bo", "lang": "Tibetan", "roman": "kho lum po", "sense": "capital of Sri Lanka", "word": "ཁོ་ལུམ་པོ" }, { "code": "tk", "lang": "Turkmen", "sense": "capital of Sri Lanka", "word": "Kolombo" }, { "code": "uk", "lang": "Ukrainian", "roman": "Kolómbo", "sense": "capital of Sri Lanka", "tags": [ "masculine" ], "word": "Коло́мбо" }, { "code": "ur", "lang": "Urdu", "roman": "kolambo", "sense": "capital of Sri Lanka", "tags": [ "masculine" ], "word": "کولمبو" }, { "code": "ug", "lang": "Uyghur", "roman": "kolombo", "sense": "capital of Sri Lanka", "word": "كولومبو" }, { "code": "uz", "lang": "Uzbek", "sense": "capital of Sri Lanka", "word": "Kolombo" }, { "code": "vi", "lang": "Vietnamese", "sense": "capital of Sri Lanka", "word": "Cô-lôm-bô" }, { "code": "yi", "lang": "Yiddish", "roman": "kolombo", "sense": "capital of Sri Lanka", "tags": [ "neuter" ], "word": "קאָלאָמבאָ" } ], "wikipedia": [ "Colombo" ], "word": "Colombo" } { "categories": [ "English entries with incorrect language header", "English lemmas", "English proper nouns", "English terms borrowed from Italian", "English terms derived from Italian", "English uncountable nouns", "Pages with 5 entries", "Pages with entries", "Rhymes:English/ʌmbəʊ", "Rhymes:English/ʌmbəʊ/3 syllables" ], "etymology_number": 2, "etymology_templates": [ { "args": { "1": "en", "2": "it", "3": "Colombo" }, "expansion": "Italian Colombo", "name": "bor" } ], "etymology_text": "From Italian Colombo, from colombo (“pigeon, dove”).", "head_templates": [ { "args": {}, "expansion": "Colombo", "name": "en-proper noun" } ], "lang": "English", "lang_code": "en", "pos": "name", "senses": [ { "categories": [ "English surnames", "English surnames from Italian" ], "glosses": [ "A surname from Italian." ], "links": [ [ "surname", "surname" ] ] } ], "sounds": [ { "ipa": "/kəˈlɒm.bəʊ/", "tags": [ "UK" ] }, { "ipa": "/kəˈlʌm.bəʊ/", "tags": [ "UK" ] }, { "ipa": "/ˈkɒl.əm.bəʊ/", "tags": [ "UK", "also" ], "topics": [ "city", "cities", "region", "location" ] }, { "audio": "LL-Q1860 (eng)-Vealhurl-Colombo.wav", "mp3_url": "https://upload.wikimedia.org/wikipedia/commons/transcoded/4/47/LL-Q1860_%28eng%29-Vealhurl-Colombo.wav/LL-Q1860_%28eng%29-Vealhurl-Colombo.wav.mp3", "ogg_url": "https://upload.wikimedia.org/wikipedia/commons/transcoded/4/47/LL-Q1860_%28eng%29-Vealhurl-Colombo.wav/LL-Q1860_%28eng%29-Vealhurl-Colombo.wav.ogg" }, { "audio": "LL-Q1860 (eng)-Vealhurl-Colombo2.wav", "mp3_url": "https://upload.wikimedia.org/wikipedia/commons/transcoded/5/5b/LL-Q1860_%28eng%29-Vealhurl-Colombo2.wav/LL-Q1860_%28eng%29-Vealhurl-Colombo2.wav.mp3", "ogg_url": "https://upload.wikimedia.org/wikipedia/commons/transcoded/5/5b/LL-Q1860_%28eng%29-Vealhurl-Colombo2.wav/LL-Q1860_%28eng%29-Vealhurl-Colombo2.wav.ogg" }, { "audio": "LL-Q1860 (eng)-Vealhurl-Colombo3.wav", "mp3_url": "https://upload.wikimedia.org/wikipedia/commons/transcoded/4/4b/LL-Q1860_%28eng%29-Vealhurl-Colombo3.wav/LL-Q1860_%28eng%29-Vealhurl-Colombo3.wav.mp3", "ogg_url": "https://upload.wikimedia.org/wikipedia/commons/transcoded/4/4b/LL-Q1860_%28eng%29-Vealhurl-Colombo3.wav/LL-Q1860_%28eng%29-Vealhurl-Colombo3.wav.ogg" }, { "rhymes": "-ʌmbəʊ" } ], "wikipedia": [ "Colombo" ], "word": "Colombo" }
Download raw JSONL data for Colombo meaning in English (17.1kB)
This page is a part of the kaikki.org machine-readable English dictionary. This dictionary is based on structured data extracted on 2024-11-06 from the enwiktionary dump dated 2024-10-02 using wiktextract (fbeafe8 and 7f03c9b). The data shown on this site has been post-processed and various details (e.g., extra categories) removed, some information disambiguated, and additional data merged from other sources. See the raw data download page for the unprocessed wiktextract data.
If you use this data in academic research, please cite Tatu Ylonen: Wiktextract: Wiktionary as Machine-Readable Structured Data, Proceedings of the 13th Conference on Language Resources and Evaluation (LREC), pp. 1317-1325, Marseille, 20-25 June 2022. Linking to the relevant page(s) under https://kaikki.org would also be greatly appreciated.