See Unihan on Wiktionary
{ "etymology_templates": [ { "args": { "1": "en", "2": "uni", "3": "Han" }, "expansion": "uni- + Han", "name": "prefix" } ], "etymology_text": "From uni- + Han.", "head_templates": [ { "args": {}, "expansion": "Unihan", "name": "en-proper noun" } ], "lang": "English", "lang_code": "en", "pos": "name", "senses": [ { "categories": [ { "kind": "other", "name": "English entries with incorrect language header", "parents": [ "Entries with incorrect language header", "Entry maintenance" ], "source": "w" }, { "kind": "other", "name": "English terms prefixed with uni-", "parents": [], "source": "w" }, { "kind": "other", "name": "Pages with 1 entry", "parents": [], "source": "w" }, { "kind": "other", "name": "Pages with entries", "parents": [], "source": "w" }, { "kind": "topical", "langcode": "en", "name": "Computing", "orig": "en:Computing", "parents": [ "Technology", "All topics", "Fundamental" ], "source": "w" }, { "kind": "topical", "langcode": "en", "name": "Typography", "orig": "en:Typography", "parents": [ "Printing", "Writing", "Industries", "Human behaviour", "Language", "Business", "Human", "Communication", "Economics", "Society", "All topics", "Social sciences", "Fundamental", "Sciences" ], "source": "w" } ], "glosses": [ "A character set, a subset of Unicode, that attempts to unify the regional and historical variants of Han characters by treating them as different glyphs representing the same grapheme." ], "id": "en-Unihan-en-name-6KdSR3Xu", "links": [ [ "computing", "computing#Noun" ], [ "typography", "typography" ], [ "character set", "character set" ], [ "subset", "subset" ], [ "Unicode", "Unicode" ], [ "unify", "unify" ], [ "Han", "Han" ], [ "glyph", "glyph" ], [ "grapheme", "grapheme" ] ], "raw_glosses": [ "(computing, typography) A character set, a subset of Unicode, that attempts to unify the regional and historical variants of Han characters by treating them as different glyphs representing the same grapheme." 
], "topics": [ "computing", "engineering", "mathematics", "media", "natural-sciences", "physical-sciences", "publishing", "sciences", "typography" ], "wikipedia": [ "Unihan" ] } ], "sounds": [ { "audio": "en-uk-Unihan.ogg", "mp3_url": "https://upload.wikimedia.org/wikipedia/commons/transcoded/8/8f/En-uk-Unihan.ogg/En-uk-Unihan.ogg.mp3", "ogg_url": "https://upload.wikimedia.org/wikipedia/commons/8/8f/En-uk-Unihan.ogg" } ], "word": "Unihan" }
{ "etymology_templates": [ { "args": { "1": "en", "2": "uni", "3": "Han" }, "expansion": "uni- + Han", "name": "prefix" } ], "etymology_text": "From uni- + Han.", "head_templates": [ { "args": {}, "expansion": "Unihan", "name": "en-proper noun" } ], "lang": "English", "lang_code": "en", "pos": "name", "senses": [ { "categories": [ "English entries with incorrect language header", "English lemmas", "English proper nouns", "English terms prefixed with uni-", "English uncountable nouns", "Pages with 1 entry", "Pages with entries", "en:Computing", "en:Typography" ], "glosses": [ "A character set, a subset of Unicode, that attempts to unify the regional and historical variants of Han characters by treating them as different glyphs representing the same grapheme." ], "links": [ [ "computing", "computing#Noun" ], [ "typography", "typography" ], [ "character set", "character set" ], [ "subset", "subset" ], [ "Unicode", "Unicode" ], [ "unify", "unify" ], [ "Han", "Han" ], [ "glyph", "glyph" ], [ "grapheme", "grapheme" ] ], "raw_glosses": [ "(computing, typography) A character set, a subset of Unicode, that attempts to unify the regional and historical variants of Han characters by treating them as different glyphs representing the same grapheme." ], "topics": [ "computing", "engineering", "mathematics", "media", "natural-sciences", "physical-sciences", "publishing", "sciences", "typography" ], "wikipedia": [ "Unihan" ] } ], "sounds": [ { "audio": "en-uk-Unihan.ogg", "mp3_url": "https://upload.wikimedia.org/wikipedia/commons/transcoded/8/8f/En-uk-Unihan.ogg/En-uk-Unihan.ogg.mp3", "ogg_url": "https://upload.wikimedia.org/wikipedia/commons/8/8f/En-uk-Unihan.ogg" } ], "word": "Unihan" }
Download raw JSONL data for Unihan meaning in All languages combined (1.6kB)
This page is a part of the kaikki.org machine-readable All languages combined dictionary. This dictionary is based on structured data extracted on 2024-11-06 from the enwiktionary dump dated 2024-10-02 using wiktextract (fbeafe8 and 7f03c9b). The data shown on this site has been post-processed: various details (e.g., extra categories) have been removed, some information has been disambiguated, and additional data has been merged from other sources. See the raw data download page for the unprocessed wiktextract data.
If you use this data in academic research, please cite Tatu Ylonen: Wiktextract: Wiktionary as Machine-Readable Structured Data, Proceedings of the 13th Conference on Language Resources and Evaluation (LREC), pp. 1317-1325, Marseille, 20-25 June 2022. Linking to the relevant page(s) under https://kaikki.org would also be greatly appreciated.