See caheip on Wiktionary
{ "etymology_templates": [ { "args": { "1": "pac", "2": "mkh-kat-pro", "3": "*kaheep" }, "expansion": "Proto-Katuic *kaheep", "name": "inh" }, { "args": { "1": "pac", "2": "mkh-pro", "3": "-" }, "expansion": "Proto-Mon-Khmer", "name": "inh" }, { "args": { "1": "sea", "2": "ke'èèp" }, "expansion": "Semai ke'èèp", "name": "cog" }, { "args": { "1": "bdq", "2": "kơep" }, "expansion": "Bahnar kơep", "name": "cog" }, { "args": { "1": "hal", "2": "gơjip" }, "expansion": "Halang gơjip", "name": "cog" }, { "args": { "1": "km", "2": "ក្អែប" }, "expansion": "Khmer ក្អែប (kʼaep)", "name": "cog" }, { "args": { "1": "kjg", "2": "-" }, "expansion": "Khmu", "name": "cog" }, { "args": { "1": "ncb", "2": "-" }, "expansion": "Central Nicobarese", "name": "cog" }, { "args": { "1": "lbn", "2": "-" }, "expansion": "Lamet", "name": "cog" }, { "args": { "1": "thm", "2": "-" }, "expansion": "Thavung", "name": "cog" }, { "args": { "1": "aem", "2": "-" }, "expansion": "Arem", "name": "cog" }, { "args": { "1": "*-h-" }, "expansion": "*-h-", "name": "IPAfont" }, { "args": { "1": "*-s-" }, "expansion": "*-s-", "name": "IPAfont" }, { "args": { "1": "*-h-" }, "expansion": "*-h-", "name": "IPAfont" }, { "args": { "1": "*-h-" }, "expansion": "*-h-", "name": "IPAfont" }, { "args": { "1": "*-ɟ-" }, "expansion": "*-ɟ-", "name": "IPAfont" } ], "etymology_text": "From Proto-Katuic *kaheep, from Proto-Mon-Khmer. Cognate with Semai ke'èèp, Bahnar kơep, Halang gơjip, Khmer ក្អែប (kʼaep), Khmu [Cuang] kʔiːp, Central Nicobarese [Nancowry] kaēap, Lamet [Lambang] səʔíp, Thavung kasḭ̂ːp, Arem katʰɪːp.\nKatuic has *-h- for this word; Khmer, Aslian and Nicobarese have zero consonant; Vietic and (possibly) Palaungic have *-s-; Khmuic is inconclusive for either *-h- or zero-consonant (since *-h- was already lost at Proto-Khmuic stage, it is not possible to tell); Bahnaric reflexes are split between those that show zero consonant (such as Bahnar) and those that show *-ɟ- (such as Halang).", "head_templates": [ { "args": { "1": "pac", "2": "noun", "head": "" }, "expansion": "caheip", "name": "head" }, { "args": {}, "expansion": "caheip", "name": "pac-noun" } ], "lang": "Pacoh", "lang_code": "pac", "pos": "noun", "senses": [ { "categories": [ { "kind": "other", "name": "Pacoh entries with incorrect language header", "parents": [ "Entries with incorrect language header", "Entry maintenance" ], "source": "w" }, { "kind": "other", "name": "Pages with 1 entry", "parents": [], "source": "w" }, { "kind": "other", "name": "Pages with entries", "parents": [], "source": "w" } ], "glosses": [ "centipede" ], "id": "en-caheip-pac-noun-YZiPLanh", "links": [ [ "centipede", "centipede" ] ], "qualifier": "Tal-ay dialect", "raw_glosses": [ "(Tal-ay dialect) centipede" ], "synonyms": [ { "alt": "Pahi Tamprin, Pahi Axap, Kadô", "word": "cahep" } ] } ], "sounds": [ { "ipa": "[kahḭːp]" } ], "word": "caheip" }
{ "etymology_templates": [ { "args": { "1": "pac", "2": "mkh-kat-pro", "3": "*kaheep" }, "expansion": "Proto-Katuic *kaheep", "name": "inh" }, { "args": { "1": "pac", "2": "mkh-pro", "3": "-" }, "expansion": "Proto-Mon-Khmer", "name": "inh" }, { "args": { "1": "sea", "2": "ke'èèp" }, "expansion": "Semai ke'èèp", "name": "cog" }, { "args": { "1": "bdq", "2": "kơep" }, "expansion": "Bahnar kơep", "name": "cog" }, { "args": { "1": "hal", "2": "gơjip" }, "expansion": "Halang gơjip", "name": "cog" }, { "args": { "1": "km", "2": "ក្អែប" }, "expansion": "Khmer ក្អែប (kʼaep)", "name": "cog" }, { "args": { "1": "kjg", "2": "-" }, "expansion": "Khmu", "name": "cog" }, { "args": { "1": "ncb", "2": "-" }, "expansion": "Central Nicobarese", "name": "cog" }, { "args": { "1": "lbn", "2": "-" }, "expansion": "Lamet", "name": "cog" }, { "args": { "1": "thm", "2": "-" }, "expansion": "Thavung", "name": "cog" }, { "args": { "1": "aem", "2": "-" }, "expansion": "Arem", "name": "cog" }, { "args": { "1": "*-h-" }, "expansion": "*-h-", "name": "IPAfont" }, { "args": { "1": "*-s-" }, "expansion": "*-s-", "name": "IPAfont" }, { "args": { "1": "*-h-" }, "expansion": "*-h-", "name": "IPAfont" }, { "args": { "1": "*-h-" }, "expansion": "*-h-", "name": "IPAfont" }, { "args": { "1": "*-ɟ-" }, "expansion": "*-ɟ-", "name": "IPAfont" } ], "etymology_text": "From Proto-Katuic *kaheep, from Proto-Mon-Khmer. Cognate with Semai ke'èèp, Bahnar kơep, Halang gơjip, Khmer ក្អែប (kʼaep), Khmu [Cuang] kʔiːp, Central Nicobarese [Nancowry] kaēap, Lamet [Lambang] səʔíp, Thavung kasḭ̂ːp, Arem katʰɪːp.\nKatuic has *-h- for this word; Khmer, Aslian and Nicobarese have zero consonant; Vietic and (possibly) Palaungic have *-s-; Khmuic is inconclusive for either *-h- or zero-consonant (since *-h- was already lost at Proto-Khmuic stage, it is not possible to tell); Bahnaric reflexes are split between those that show zero consonant (such as Bahnar) and those that show *-ɟ- (such as Halang).", "head_templates": [ { "args": { "1": "pac", "2": "noun", "head": "" }, "expansion": "caheip", "name": "head" }, { "args": {}, "expansion": "caheip", "name": "pac-noun" } ], "lang": "Pacoh", "lang_code": "pac", "pos": "noun", "senses": [ { "categories": [ "Pacoh entries with incorrect language header", "Pacoh lemmas", "Pacoh nouns", "Pacoh terms derived from Proto-Katuic", "Pacoh terms derived from Proto-Mon-Khmer", "Pacoh terms inherited from Proto-Katuic", "Pacoh terms inherited from Proto-Mon-Khmer", "Pages with 1 entry", "Pages with entries" ], "glosses": [ "centipede" ], "links": [ [ "centipede", "centipede" ] ], "qualifier": "Tal-ay dialect", "raw_glosses": [ "(Tal-ay dialect) centipede" ] } ], "sounds": [ { "ipa": "[kahḭːp]" } ], "synonyms": [ { "alt": "Pahi Tamprin, Pahi Axap, Kadô", "word": "cahep" } ], "word": "caheip" }
Download raw JSONL data for caheip meaning in All languages combined (2.7kB)
This page is a part of the kaikki.org machine-readable All languages combined dictionary. This dictionary is based on structured data extracted on 2025-02-15 from the enwiktionary dump dated 2025-02-02 using wiktextract (ca09fec and c40eb85). The data shown on this site has been post-processed and various details (e.g., extra categories) removed, some information disambiguated, and additional data merged from other sources. See the raw data download page for the unprocessed wiktextract data.
If you use this data in academic research, please cite Tatu Ylonen: Wiktextract: Wiktionary as Machine-Readable Structured Data, Proceedings of the 13th Conference on Language Resources and Evaluation (LREC), pp. 1317-1325, Marseille, 20-25 June 2022. Linking to the relevant page(s) under https://kaikki.org would also be greatly appreciated.