ISSR_Visual_Model / ctfidf_config.json
D0men1c0's picture
Add BERTopic model
c6e22f4 verified
raw
history blame contribute delete
654 Bytes
{
"ctfidf_model": {
"bm25_weighting": false,
"reduce_frequent_words": true
},
"vectorizer_model": {
"params": {
"analyzer": "word",
"binary": false,
"decode_error": "strict",
"encoding": "utf-8",
"input": "content",
"lowercase": true,
"max_df": 1.0,
"max_features": null,
"min_df": 1,
"ngram_range": [
1,
1
],
"stop_words": "english",
"strip_accents": null,
"token_pattern": "(?u)\\b\\w\\w+\\b",
"vocabulary": null
},
"vocab": {
"gun": 1,
"drug": 0,
"people": 2
}
}
}