Versions Compared

Key

  • This line was added.
  • This line was removed.
  • Formatting was changed.

...

Code Block
languagejson
{
    "add_lemmization": false, # add lemmization to the words
    "cache_lemmas": false, # save the lemmas in a cache to improve the peroformancesperformances
    "filter_list": [], # List of terms you do not want to see
    "input_field": [ "body"], # where get the input text
    "max_chunk_len": 2, # minmax number of words in a chunk
    "min_word_len": 4, #  min character in a words
    "output_field": "terms", #where# where store the output (list)
    "p_significant_terms": 0.2,  # % of important terms to pickup
    "save_model": true, # #savesave the generate model
    "step": "embedder",
    "type": "terms_extraction"
},

...