JSON data structure browser

Download full JSON mapping

Fields and tags index

The raw JSON data used to generate this site consists of an individual JSON object for each separate word. The browser here is a union of all these objects combined into one, built by recursively delving through each of them and adding newly found nodes to a parallel mapping.

{
"abbreviations":
[
{
"sense_index": sense_index seen in chilský [čeština]; reached 122 times,
"word": word seen in eventuálně [čeština]; reached 182 times
}
]
"antonyms":
[
{
"raw_tags":
[raw_tags seen in jemně [čeština]; reached 212 times]
"sense_index": sense_index seen in obrovský [čeština]; reached 20726 times,
"tags":
[tags seen in jemně [čeština]; reached 278 times]
"word": word seen in obrovský [čeština]; reached 21085 times
}
]
"categories":
[categories seen in [čeština]; reached 312554 times]
"derived":
[
{
"word": word seen in 洗う [japonština]; reached 199 times
}
]
"etymology_texts":
[etymology_texts seen in house [čeština]; reached 29290 times]
"forms":
[
{
"form": form seen in [čeština]; reached 1596596 times,
"raw_tags":
[raw_tags seen in Helsinky [čeština]; reached 1350715 times]
"tags":
[tags seen in [čeština]; reached 3894649 times]
}
]
"hyphenations":
[
{
"parts":
[parts seen in [čeština]; reached 207663 times]
}
]
"lang": lang seen in [čeština]; reached 181267 times,
"lang_code": lang_code seen in [čeština]; reached 181267 times,
"note": note seen in tiyo [tagalog]; reached 16 times,
"phrases":
[
{
"raw_tags":
[raw_tags seen in území [čeština]; reached 15 times]
"sense_index": sense_index seen in pifka [čeština]; reached 131 times,
"tags":
[tags seen in recepis [čeština]; reached 3 times]
"word": word seen in jihomoravský [čeština]; reached 15400 times
}
]
"pos": pos seen in [čeština]; reached 181267 times,
"pos_title": pos_title seen in [čeština]; reached 181267 times,
"proverbs":
[
{
"sense_index": sense_index seen in kvapný [čeština]; reached 11 times,
"word": word seen in štěkat [čeština]; reached 1558 times
}
]
"raw_tags":
[raw_tags seen in [čeština]; reached 61905 times]
"related":
[
{
"raw_tags":
[raw_tags seen in drát [čeština]; reached 12 times]
"sense_index": sense_index seen in multidisciplinární [čeština]; reached 777 times,
"tags":
[tags seen in bachor [čeština]; reached 41 times]
"word": word seen in house [čeština]; reached 258229 times
}
]
"senses":
[
{
"categories":
[categories seen in desk [čeština]; reached 31359 times]
"examples":
[
{
"bold_text_offsets":
[
[bold_text_offsets seen in [čeština]; reached 43220 times]
]
"ref": ref seen in [čeština]; reached 30660 times,
"text": text seen in [čeština]; reached 55385 times,
"translation": translation seen in zpyták [čeština]; reached 10725 times
}
]
"form_of":
[
{
"word": word seen in desk [čeština]; reached 76868 times
}
]
"glosses":
[glosses seen in [čeština]; reached 266647 times]
"raw_tags":
[raw_tags seen in zpyták [čeština]; reached 8518 times]
"tags":
[tags seen in house [čeština]; reached 97153 times]
"topics":
[topics seen in alveolopalatála [čeština]; reached 14204 times]
}
]
"sounds":
[
{
"audio": audio seen in Helsinky [čeština]; reached 36791 times,
"flac_url": flac_url seen in rain fire and brimstone [angličtina]; reached 9 times,
"homophone": homophone seen in čubka [čeština]; reached 24121 times,
"ipa": ipa seen in [čeština]; reached 153509 times,
"mp3_url": mp3_url seen in Helsinky [čeština]; reached 36791 times,
"oga_url": oga_url seen in [čeština]; reached 204 times,
"ogg_url": ogg_url seen in Helsinky [čeština]; reached 36588 times,
"opus_url": opus_url seen in Athens [angličtina]; reached 5 times,
"other": other seen in вредитель [ruština]; reached 882 times,
"raw_tags":
[raw_tags seen in fluor [čeština]; reached 4849 times]
"tags":
[tags seen in tvůj [čeština]; reached 386 times]
"wav_url": wav_url seen in skutečnost [čeština]; reached 2645 times,
"zh_pron": zh_pron seen in [čínština]; reached 255 times
}
]
"synonyms":
[
{
"raw_tags":
[raw_tags seen in srdeční [čeština]; reached 4126 times]
"sense_index": sense_index seen in [čeština]; reached 102991 times,
"tags":
[tags seen in desk [čeština]; reached 9275 times]
"word": word seen in [čeština]; reached 104749 times
}
]
"tags":
[tags seen in house [čeština]; reached 123132 times]
"translations":
[
{
"lang": lang seen in [čeština]; reached 227804 times,
"lang_code": lang_code seen in [čeština]; reached 227804 times,
"raw_tags":
[raw_tags seen in laktóza [čeština]; reached 1256 times]
"sense": sense seen in [čeština]; reached 201567 times,
"sense_index": sense_index seen in [čeština]; reached 227804 times,
"tags":
[tags seen in house [čeština]; reached 91316 times]
"word": word seen in [čeština]; reached 227804 times
}
]
"word": word seen in [čeština]; reached 181267 times
}

This page is a part of the kaikki.org machine-readable dictionary. This dictionary is based on structured data extracted on 2025-10-07 from the cswiktionary dump dated 2025-10-01 using wiktextract (19bd8d3 and 1ab82da). The data shown on this site has been post-processed and various details (e.g., extra categories) removed, some information disambiguated, and additional data merged from other sources. See the raw data download page for the unprocessed wiktextract data.

If you use this data in academic research, please cite Tatu Ylonen: Wiktextract: Wiktionary as Machine-Readable Structured Data, Proceedings of the 13th Conference on Language Resources and Evaluation (LREC), pp. 1317-1325, Marseille, 20-25 June 2022. Linking to the relevant page(s) under https://kaikki.org would also be greatly appreciated.