davidmezzetti commited on
Commit
ab197d9
·
1 Parent(s): dd4c57a
Files changed (4) hide show
  1. README.md +24 -0
  2. config.json +31 -0
  3. model.safetensors +3 -0
  4. vocab.json +0 -0
README.md ADDED
@@ -0,0 +1,24 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ ---
2
+ tags:
3
+ - language-identification
4
+ - text-classification
5
+ - fasttext
6
+ inference: false
7
+ language: multilingual
8
+ license: cc-by-sa-3.0
9
+ library_name: staticvectors
10
+ ---
11
+
12
+ # Language Detection with StaticVectors
13
+
14
+ This model is an export of the [FastText Language Identification model](https://fasttext.cc/docs/en/language-identification.html) for [`staticvectors`](https://github.com/neuml/staticvectors). `staticvectors` enables running inference in Python with NumPy, helping it maintain solid runtime performance.
15
+
16
+
17
+ ## Usage with StaticVectors
18
+
19
+ ```python
20
+ from staticvectors import StaticVectors
21
+
22
+ model = StaticVectors("NeuML/language-id")
23
+ model.predict(["What language is this text?"])
24
+ ```
config.json ADDED
@@ -0,0 +1,31 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "model_type": "staticvectors",
3
+ "format": "fasttext",
4
+ "source": "lid.176.bin",
5
+ "lr": 0.05,
6
+ "dim": 16,
7
+ "ws": 5,
8
+ "epoch": 10,
9
+ "min_count": 1000,
10
+ "min_count_label": 0,
11
+ "neg": 5,
12
+ "word_ngrams": 1,
13
+ "loss": "hs",
14
+ "model": "supervised",
15
+ "bucket": 2000000,
16
+ "minn": 2,
17
+ "maxn": 4,
18
+ "thread": 12,
19
+ "lr_update_rate": 100,
20
+ "t": 0.0001,
21
+ "label": "__label__",
22
+ "verbose": 2,
23
+ "pretrained_vectors": "",
24
+ "save_output": false,
25
+ "seed": 0,
26
+ "qout": false,
27
+ "retrain": false,
28
+ "qnorm": false,
29
+ "cutoff": 0,
30
+ "dsub": 2
31
+ }
model.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f13c8aa2cf8800d86fe86ce9b568e69d1f02f3985fc35aa1f1b515f25efa9d4d
3
+ size 130572072
vocab.json ADDED
The diff for this file is too large to render. See raw diff