JSON data structure browser

Download full JSON mapping

Fields and tags index

The raw JSON data used to generate this site consists of an individual JSON object for each separate word. The browser here is a union of all these objects combined into one, built by recursively descending through each of them and adding newly found nodes to a parallel mapping.

{
"antonyms":
[
{
"raw_tags":
[raw_tags seen in pořádně [čeština]; reached 214 times]
"sense_index": sense_index seen in jednou [čeština]; reached 21071 times,
"tags":
[tags seen in pyšný [čeština]; reached 278 times]
"word": word seen in jednou [čeština]; reached 21429 times
}
]
"categories":
[categories seen in ligami [čeština]; reached 316443 times]
"derived":
[
{
"word": word seen in 訳す [japonština]; reached 205 times
}
]
"etymology_texts":
[etymology_texts seen in být v limbu [čeština]; reached 31455 times]
"forms":
[
{
"form": form seen in tuberkulóza [čeština]; reached 1608901 times,
"raw_tags":
[raw_tags seen in pankově [čeština]; reached 430279 times]
"roman": roman seen in 訳す [japonština]; reached 411 times,
"tags":
[tags seen in tuberkulóza [čeština]; reached 4893056 times]
}
]
"hyphenations":
[
{
"parts":
[parts seen in ligami [čeština]; reached 217769 times]
}
]
"lang": lang seen in ligami [čeština]; reached 190591 times,
"lang_code": lang_code seen in ligami [čeština]; reached 190591 times,
"note": note seen in saan [tagalog]; reached 21 times,
"phrases":
[
{
"word": word seen in píše [čeština]; reached 10 times
}
]
"pos": pos seen in ligami [čeština]; reached 190591 times,
"pos_title": pos_title seen in ligami [čeština]; reached 190591 times,
"proverbs":
[
{
"sense_index": sense_index seen in šplouchat [čeština]; reached 4 times,
"word": word seen in nový [čeština]; reached 1563 times
}
]
"raw_tags":
[raw_tags seen in cestujících [čeština]; reached 62358 times]
"related":
[
{
"raw_tags":
[raw_tags seen in drát [čeština]; reached 12 times]
"sense_index": sense_index seen in muzikant [čeština]; reached 781 times,
"tags":
[tags seen in muzikant [čeština]; reached 41 times]
"word": word seen in tuberkulóza [čeština]; reached 263629 times
}
]
"senses":
[
{
"categories":
[categories seen in bělina [čeština]; reached 32151 times]
"examples":
[
{
"bold_text_offsets":
[
[bold_text_offsets seen in žíněnka [čeština]; reached 44900 times]
]
"ref": ref seen in cestujících [čeština]; reached 31157 times,
"text": text seen in cestujících [čeština]; reached 56073 times,
"translation": translation seen in žíněnka [čeština]; reached 10889 times
}
]
"form_of":
[
{
"word": word seen in ligami [čeština]; reached 92410 times
}
]
"glosses":
[glosses seen in ligami [čeština]; reached 284811 times]
"raw_tags":
[raw_tags seen in vašeta [čeština]; reached 8684 times]
"tags":
[tags seen in ligami [čeština]; reached 113783 times]
"topics":
[topics seen in albinizmus [čeština]; reached 14559 times]
}
]
"sounds":
[
{
"audio": audio seen in překvapení [čeština]; reached 40035 times,
"flac_url": flac_url seen in rain fire and brimstone [angličtina]; reached 12 times,
"homophone": homophone seen in trápily [čeština]; reached 26892 times,
"ipa": ipa seen in ligami [čeština]; reached 162642 times,
"mp3_url": mp3_url seen in překvapení [čeština]; reached 40035 times,
"oga_url": oga_url seen in aspik [čeština]; reached 225 times,
"ogg_url": ogg_url seen in překvapení [čeština]; reached 39811 times,
"opus_url": opus_url seen in Athens [angličtina]; reached 5 times,
"other": other seen in внимательный [ruština]; reached 887 times,
"raw_tags":
[raw_tags seen in diva [čeština]; reached 5082 times]
"tags":
[tags seen in buďte [čeština]; reached 885 times]
"wav_url": wav_url seen in hradiště [čeština]; reached 3133 times,
"zh_pron": zh_pron seen in 籀文 [čínština]; reached 629 times
}
]
"synonyms":
[
{
"raw_tags":
[raw_tags seen in tuberkulóza [čeština]; reached 4096 times]
"sense_index": sense_index seen in tuberkulóza [čeština]; reached 105482 times,
"tags":
[tags seen in tuberkulóza [čeština]; reached 9519 times]
"word": word seen in tuberkulóza [čeština]; reached 107275 times
}
]
"tags":
[tags seen in ligami [čeština]; reached 131583 times]
"translations":
[
{
"lang": lang seen in tuberkulóza [čeština]; reached 232124 times,
"lang_code": lang_code seen in tuberkulóza [čeština]; reached 232124 times,
"raw_tags":
[raw_tags seen in žula [čeština]; reached 1275 times]
"sense": sense seen in tuberkulóza [čeština]; reached 204516 times,
"sense_index": sense_index seen in tuberkulóza [čeština]; reached 232124 times,
"tags":
[tags seen in tuberkulóza [čeština]; reached 92585 times]
"word": word seen in tuberkulóza [čeština]; reached 232124 times
}
]
"word": word seen in ligami [čeština]; reached 190591 times
}

This page is a part of the kaikki.org machine-readable dictionary. This dictionary is based on structured data extracted on 2026-02-27 from the cswiktionary dump dated 2026-02-02 using wiktextract (c4ca749 and 59dc20b). The data shown on this site has been post-processed and various details (e.g., extra categories) removed, some information disambiguated, and additional data merged from other sources. See the raw data download page for the unprocessed wiktextract data.

If you use this data in academic research, please cite Tatu Ylonen: Wiktextract: Wiktionary as Machine-Readable Structured Data, Proceedings of the 13th Conference on Language Resources and Evaluation (LREC), pp. 1317-1325, Marseille, 20-25 June 2022. Linking to the relevant page(s) under https://kaikki.org would also be greatly appreciated.