language model in All languages combined

[Show JSON for postprocessed kaikki.org data shown on this page ▼] [Hide JSON for postprocessed kaikki.org data shown on this page ▲]

{
  "forms": [
    {
      "form": "language models",
      "tags": [
        "plural"
      ]
    }
  ],
  "head_templates": [
    {
      "args": {},
      "expansion": "language model (plural language models)",
      "name": "en-noun"
    }
  ],
  "lang": "English",
  "lang_code": "en",
  "pos": "noun",
  "senses": [
    {
      "categories": [
        {
          "kind": "other",
          "name": "English entries with incorrect language header",
          "parents": [],
          "source": "w"
        },
        {
          "kind": "other",
          "name": "Entries with translation boxes",
          "parents": [],
          "source": "w"
        },
        {
          "kind": "other",
          "name": "Pages with 1 entry",
          "parents": [],
          "source": "w"
        },
        {
          "kind": "other",
          "name": "Pages with entries",
          "parents": [],
          "source": "w"
        },
        {
          "kind": "other",
          "name": "Terms with Dutch translations",
          "parents": [],
          "source": "w"
        },
        {
          "kind": "other",
          "name": "Terms with Finnish translations",
          "parents": [],
          "source": "w"
        },
        {
          "kind": "other",
          "name": "Terms with German translations",
          "parents": [],
          "source": "w"
        },
        {
          "kind": "other",
          "name": "Terms with Romanian translations",
          "parents": [],
          "source": "w"
        },
        {
          "kind": "other",
          "name": "Terms with Swedish translations",
          "parents": [],
          "source": "w"
        },
        {
          "kind": "other",
          "langcode": "en",
          "name": "Machine learning",
          "orig": "en:Machine learning",
          "parents": [],
          "source": "w"
        }
      ],
      "derived": [
        {
          "word": "large language model"
        },
        {
          "word": "small language model"
        }
      ],
      "examples": [
        {
          "bold_text_offsets": [
            [
              17,
              32
            ]
          ],
          "ref": "2022 [2009], Chengxiang Zhai, Statistical Language Models for Information Retrieval, Springer Nature, →ISBN, page 9:",
          "text": "Although unigram language models are simple, they clearly make unrealistic assumptions about word occurrences in text.",
          "type": "quote"
        }
      ],
      "glosses": [
        "A machine learning model that assigns probabilities to sequences of characters or words, and/or is capable of generating plausible subsequent text from a given prompt."
      ],
      "hypernyms": [
        {
          "word": "model#Noun"
        }
      ],
      "id": "en-language_model-en-noun-en:Q3621696",
      "links": [
        [
          "machine learning",
          "machine learning"
        ],
        [
          "model",
          "model"
        ],
        [
          "probabilities",
          "probability"
        ],
        [
          "sequences",
          "sequences"
        ],
        [
          "character",
          "character"
        ],
        [
          "word",
          "word"
        ],
        [
          "generating",
          "generate"
        ],
        [
          "plausible",
          "plausible"
        ],
        [
          "text",
          "text"
        ],
        [
          "prompt",
          "prompt"
        ]
      ],
      "qualifier": "machine learning",
      "raw_glosses": [
        "(machine learning) A machine learning model that assigns probabilities to sequences of characters or words, and/or is capable of generating plausible subsequent text from a given prompt."
      ],
      "senseid": [
        "en:Q3621696"
      ],
      "synonyms": [
        {
          "word": "LM"
        }
      ],
      "translations": [
        {
          "code": "nl",
          "lang": "Dutch",
          "lang_code": "nl",
          "sense": "ML model",
          "tags": [
            "neuter"
          ],
          "word": "taalmodel"
        },
        {
          "code": "fi",
          "lang": "Finnish",
          "lang_code": "fi",
          "sense": "ML model",
          "word": "kielimalli"
        },
        {
          "code": "de",
          "lang": "German",
          "lang_code": "de",
          "sense": "ML model",
          "tags": [
            "neuter"
          ],
          "word": "Sprachmodell"
        },
        {
          "code": "ro",
          "lang": "Romanian",
          "lang_code": "ro",
          "sense": "ML model",
          "tags": [
            "neuter"
          ],
          "word": "model de limbă"
        },
        {
          "code": "sv",
          "lang": "Swedish",
          "lang_code": "sv",
          "sense": "ML model",
          "tags": [
            "common-gender"
          ],
          "word": "språkmodell"
        }
      ],
      "wikidata": [
        "Q3621696"
      ]
    }
  ],
  "word": "language model"
}

[Show JSON for raw wiktextract data ▼] [Hide JSON for raw wiktextract data ▲]

{
  "derived": [
    {
      "word": "large language model"
    },
    {
      "word": "small language model"
    }
  ],
  "forms": [
    {
      "form": "language models",
      "tags": [
        "plural"
      ]
    }
  ],
  "head_templates": [
    {
      "args": {},
      "expansion": "language model (plural language models)",
      "name": "en-noun"
    }
  ],
  "lang": "English",
  "lang_code": "en",
  "pos": "noun",
  "senses": [
    {
      "categories": [
        "English countable nouns",
        "English entries with incorrect language header",
        "English lemmas",
        "English multiword terms",
        "English nouns",
        "English terms with quotations",
        "Entries with translation boxes",
        "Pages with 1 entry",
        "Pages with entries",
        "Terms with Dutch translations",
        "Terms with Finnish translations",
        "Terms with German translations",
        "Terms with Romanian translations",
        "Terms with Swedish translations",
        "en:Machine learning"
      ],
      "examples": [
        {
          "bold_text_offsets": [
            [
              17,
              32
            ]
          ],
          "ref": "2022 [2009], Chengxiang Zhai, Statistical Language Models for Information Retrieval, Springer Nature, →ISBN, page 9:",
          "text": "Although unigram language models are simple, they clearly make unrealistic assumptions about word occurrences in text.",
          "type": "quote"
        }
      ],
      "glosses": [
        "A machine learning model that assigns probabilities to sequences of characters or words, and/or is capable of generating plausible subsequent text from a given prompt."
      ],
      "hypernyms": [
        {
          "word": "model#Noun"
        }
      ],
      "links": [
        [
          "machine learning",
          "machine learning"
        ],
        [
          "model",
          "model"
        ],
        [
          "probabilities",
          "probability"
        ],
        [
          "sequences",
          "sequences"
        ],
        [
          "character",
          "character"
        ],
        [
          "word",
          "word"
        ],
        [
          "generating",
          "generate"
        ],
        [
          "plausible",
          "plausible"
        ],
        [
          "text",
          "text"
        ],
        [
          "prompt",
          "prompt"
        ]
      ],
      "qualifier": "machine learning",
      "raw_glosses": [
        "(machine learning) A machine learning model that assigns probabilities to sequences of characters or words, and/or is capable of generating plausible subsequent text from a given prompt."
      ],
      "senseid": [
        "en:Q3621696"
      ],
      "synonyms": [
        {
          "word": "LM"
        }
      ],
      "wikidata": [
        "Q3621696"
      ]
    }
  ],
  "translations": [
    {
      "code": "nl",
      "lang": "Dutch",
      "lang_code": "nl",
      "sense": "ML model",
      "tags": [
        "neuter"
      ],
      "word": "taalmodel"
    },
    {
      "code": "fi",
      "lang": "Finnish",
      "lang_code": "fi",
      "sense": "ML model",
      "word": "kielimalli"
    },
    {
      "code": "de",
      "lang": "German",
      "lang_code": "de",
      "sense": "ML model",
      "tags": [
        "neuter"
      ],
      "word": "Sprachmodell"
    },
    {
      "code": "ro",
      "lang": "Romanian",
      "lang_code": "ro",
      "sense": "ML model",
      "tags": [
        "neuter"
      ],
      "word": "model de limbă"
    },
    {
      "code": "sv",
      "lang": "Swedish",
      "lang_code": "sv",
      "sense": "ML model",
      "tags": [
        "common-gender"
      ],
      "word": "språkmodell"
    }
  ],
  "word": "language model"
}

Download raw JSONL data for language model meaning in All languages combined (2.5kB)

This page is a part of the kaikki.org machine-readable All languages combined dictionary. This dictionary is based on structured data extracted on 2025-12-15 from the enwiktionary dump dated 2025-12-02 using wiktextract (e2469cc and 9905b1f). The data shown on this site has been post-processed and various details (e.g., extra categories) removed, some information disambiguated, and additional data merged from other sources. See the raw data download page for the unprocessed wiktextract data.

If you use this data in academic research, please cite Tatu Ylonen: Wiktextract: Wiktionary as Machine-Readable Structured Data, Proceedings of the 13th Conference on Language Resources and Evaluation (LREC), pp. 1317-1325, Marseille, 20-25 June 2022. Linking to the relevant page(s) under https://kaikki.org would also be greatly appreciated.

"language model" meaning in All languages combined

Noun [English]

Inflected forms

Alternative forms