JSON data structure browser

Download full JSON mapping

Fields and tags index

The raw JSON data used to generate this site consists of an individual JSON object for each separate word. The browser here shows the union of all these objects combined into one, built by recursively descending through each of them and adding any newly found nodes to a parallel mapping.

{
"anagrams":
[
{
"word": word seen in progeny [Bahasa Inggeris]; reached 144 times
}
]
"antonyms":
[
{
"sense": sense seen in oxidation [Bahasa Inggeris]; reached 392 times,
"word": word seen in abactinal [Bahasa Inggeris]; reached 848 times
}
]
"categories":
[categories seen in Wikipedia [Bahasa Inggeris]; reached 387682 times]
"classifiers":
[
{
"classifier": classifier seen in เพลง [Bahasa Thai]; reached 45 times,
"raw_tags":
[raw_tags seen in เพลง [Bahasa Thai]; reached 44 times]
}
]
"coordinate_terms":
[
{
"sense": sense seen in SoKor [Bahasa Inggeris]; reached 105 times,
"word": word seen in SoKor [Bahasa Inggeris]; reached 105 times
}
]
"derived":
[
{
"sense": sense seen in adjutant [Bahasa Inggeris]; reached 220 times,
"word": word seen in punctilio [Bahasa Inggeris]; reached 18996 times
}
]
"etymology_texts":
[etymology_texts seen in Wikipedia [Bahasa Inggeris]; reached 16817 times]
"forms":
[
{
"form": form seen in grouser [Bahasa Inggeris]; reached 28448 times,
"raw_tags":
[raw_tags seen in grouser [Bahasa Inggeris]; reached 11179 times]
"tags":
[tags seen in the early bird gets the worm [Bahasa Inggeris]; reached 17265 times]
}
]
"hypernyms":
[
{
"sense": sense seen in all in [Bahasa Inggeris]; reached 5 times,
"word": word seen in all in [Bahasa Inggeris]; reached 5 times
}
]
"hyphenations":
[
{
"parts":
[parts seen in lexicography [Bahasa Inggeris]; reached 38264 times]
}
]
"hyponyms":
[
{
"sense": sense seen in regicide [Bahasa Inggeris]; reached 15 times,
"word": word seen in regicide [Bahasa Inggeris]; reached 15 times
}
]
"lang": lang seen in Wikipedia [Bahasa Inggeris]; reached 75925 times,
"lang_code": lang_code seen in Wikipedia [Bahasa Inggeris]; reached 75925 times,
"notes":
[notes seen in calendar [Bahasa Inggeris]; reached 256 times]
"pos": pos seen in Wikipedia [Bahasa Inggeris]; reached 75925 times,
"pos_title": pos_title seen in grouser [Bahasa Inggeris]; reached 72020 times,
"proverbs":
[
{
"sense": sense seen in bahasa [Bahasa Melayu]; reached 20 times,
"word": word seen in the early bird gets the worm [Bahasa Inggeris]; reached 67 times
}
]
"related":
[
{
"sense": sense seen in [Bahasa Jepun]; reached 3 times,
"word": word seen in the early bird gets the worm [Bahasa Inggeris]; reached 281 times
}
]
"senses":
[
{
"alt_of":
[
{
"word": word seen in goat [Bahasa Inggeris]; reached 5 times
}
]
"attestations":
[
{
"date": date seen in hard word [Bahasa Inggeris]; reached 23 times
}
]
"categories":
[categories seen in grouser [Bahasa Inggeris]; reached 28276 times]
"examples":
[
{
"bold_literal_offsets":
[
[bold_literal_offsets seen in nanam [Bahasa Suluk]; reached 6 times]
]
"bold_roman_offsets":
[
[bold_roman_offsets seen in bertemper [Bahasa Melayu]; reached 140 times]
]
"bold_text_offsets":
[
[bold_text_offsets seen in BMTH [Bahasa Inggeris]; reached 36294 times]
]
"bold_translation_offsets":
[
[bold_translation_offsets seen in yur [Bahasa Inggeris]; reached 34996 times]
]
"literal_meaning": literal_meaning seen in nanam [Bahasa Suluk]; reached 5 times,
"ref": ref seen in BMTH [Bahasa Inggeris]; reached 305 times,
"roman": roman seen in bertemper [Bahasa Melayu]; reached 111 times,
"text": text seen in BMTH [Bahasa Inggeris]; reached 20391 times,
"translation": translation seen in yur [Bahasa Inggeris]; reached 19579 times
}
]
"form_of":
[
{
"word": word seen in SBP [Bahasa Inggeris]; reached 1886 times
}
]
"glosses":
[glosses seen in grouser [Bahasa Inggeris]; reached 84244 times]
"raw_tags":
[raw_tags seen in essay [Bahasa Inggeris]; reached 3221 times]
"tags":
[tags seen in Wikipedia [Bahasa Inggeris]; reached 7379 times]
"topics":
[topics seen in grouser [Bahasa Inggeris]; reached 3658 times]
}
]
"sounds":
[
{
"audio": audio seen in poster boy [Bahasa Inggeris]; reached 4168 times,
"flac_url": flac_url seen in siku kuu [Bahasa Swahili]; reached 7 times,
"hangeul": hangeul seen in 신경 [Bahasa Korea]; reached 149 times,
"ipa": ipa seen in essay [Bahasa Inggeris]; reached 15220 times,
"mp3_url": mp3_url seen in poster boy [Bahasa Inggeris]; reached 4168 times,
"oga_url": oga_url seen in verso [Bahasa Inggeris]; reached 43 times,
"ogg_url": ogg_url seen in poster boy [Bahasa Inggeris]; reached 4126 times,
"opus_url": opus_url seen in ethyl [Bahasa Inggeris]; reached 4 times,
"other": other seen in ihram [Bahasa Inggeris]; reached 7025 times,
"raw_tags":
[raw_tags seen in crore [Bahasa Inggeris]; reached 8317 times]
"rhymes": rhymes seen in grouser [Bahasa Inggeris]; reached 8229 times,
"roman": roman seen in 신경 [Bahasa Korea]; reached 529 times,
"tags":
[tags seen in lexicography [Bahasa Inggeris]; reached 2558 times]
"wav_url": wav_url seen in Palestine [Bahasa Inggeris]; reached 1152 times
}
]
"synonyms":
[
{
"sense": sense seen in sugar apple [Bahasa Inggeris]; reached 2803 times,
"word": word seen in sugar apple [Bahasa Inggeris]; reached 5272 times
}
]
"tags":
[tags seen in hetero- [Bahasa Inggeris]; reached 2493 times]
"translations":
[
{
"lang": lang seen in abactinal [Bahasa Inggeris]; reached 33725 times,
"lang_code": lang_code seen in abactinal [Bahasa Inggeris]; reached 33725 times,
"raw_tags":
[raw_tags seen in d'oh [Bahasa Inggeris]; reached 1354 times]
"roman": roman seen in the early bird gets the worm [Bahasa Inggeris]; reached 11053 times,
"sense": sense seen in abactinal [Bahasa Inggeris]; reached 33547 times,
"source": source seen in Rōmaji [Bahasa Inggeris]; reached 385 times,
"tags":
[tags seen in gravity [Bahasa Inggeris]; reached 13322 times]
"word": word seen in abactinal [Bahasa Inggeris]; reached 33725 times
}
]
"word": word seen in Wikipedia [Bahasa Inggeris]; reached 75925 times
}

This page is a part of the kaikki.org machine-readable dictionary. This dictionary is based on structured data extracted on 2026-07-03 from the mswiktionary dump dated 2026-06-01 using wiktextract (3a98e1b and 7f4db16). The data shown on this site has been post-processed and various details (e.g., extra categories) removed, some information disambiguated, and additional data merged from other sources. See the raw data download page for the unprocessed wiktextract data.

If you use this data in academic research, please cite Tatu Ylonen: Wiktextract: Wiktionary as Machine-Readable Structured Data, Proceedings of the 13th Conference on Language Resources and Evaluation (LREC), pp. 1317-1325, Marseille, 20-25 June 2022. Linking to the relevant page(s) under https://kaikki.org would also be greatly appreciated.