{ "ctfidf_model": { "bm25_weighting": false, "reduce_frequent_words": true }, "vectorizer_model": { "params": { "analyzer": "word", "binary": false, "decode_error": "strict", "encoding": "utf-8", "input": "content", "lowercase": true, "max_df": 1.0, "max_features": null, "min_df": 1, "ngram_range": [ 1, 1 ], "stop_words": "english", "strip_accents": null, "token_pattern": "(?u)\\b\\w\\w+\\b", "vocabulary": null }, "vocab": { "gun": 1, "drug": 0, "people": 2 } } }