gagan3012 committed on
Commit
150e8a6
1 Parent(s): ce90a9f

Update BM25S model

Browse files
.gitattributes CHANGED
@@ -34,3 +34,5 @@ saved_model/**/* filter=lfs diff=lfs merge=lfs -text
34
  *.zst filter=lfs diff=lfs merge=lfs -text
35
  *tfevents* filter=lfs diff=lfs merge=lfs -text
36
  corpus.jsonl filter=lfs diff=lfs merge=lfs -text
 
 
 
34
  *.zst filter=lfs diff=lfs merge=lfs -text
35
  *tfevents* filter=lfs diff=lfs merge=lfs -text
36
  corpus.jsonl filter=lfs diff=lfs merge=lfs -text
37
+ corpus.mmindex.json filter=lfs diff=lfs merge=lfs -text
38
+ vocab.index.json filter=lfs diff=lfs merge=lfs -text
corpus.jsonl CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:31622a65c6f640dd20ef06ae11e047ae31fc36cfc1661b8d6024903118bb42be
3
- size 12828151
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:53b2c1279fa11854c81513b9876050e32da875a730ff4e0bd691fef1221609a8
3
+ size 7886931414
corpus.mmindex.json CHANGED
@@ -1 +1,3 @@
1
- [0, 17, 248870, 434425, 704171, 720829, 814097, 826099, 839148, 839971, 860563, 921857, 932264, 951625, 962636, 981499, 1284829, 1630369, 1893308, 2440883, 2534608, 2574014, 2585616, 2608258, 2747165, 2804036, 2805663, 2909631, 2972791, 3230011, 3424676, 3528910, 3617269, 3930692, 4067165, 4481847, 4673288, 4694356, 4735420, 5271972, 5296027, 5574720, 5624083, 5687027, 5754540, 5859397, 5953308, 5964901, 6067922, 6719333, 6781167, 6858550, 7047449, 7070212, 7174291, 7313382, 7406277, 7745701, 8415731, 8599210, 8697166, 8711120, 8734073, 8912157, 8930359, 9121870, 9122925, 9164282, 9512784, 9524043, 9616599, 9671839, 9692185, 9711197, 9753354, 9766935, 9821838, 9865045, 9998959, 10276843, 10327725, 10347944, 10449292, 10474401, 10489323, 10626711, 10867606, 10885422, 10902395, 11057647, 11514997, 11526521, 11584523, 11916307, 12226214, 12262873, 12344847, 12348098, 12349839, 12428236]
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5fe1e2e09a3ca01f079f3502fc4a77bbe811630dce13c99e1c6bf18e1a616e00
3
+ size 13008476
data.csc.index.npy CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:89e5a40f8256e07ffd672ab793c2becc0b1ec7e7c9351de3ae9beb252a772fcd
3
- size 503228
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b5764b3f85910b585db43f1a2bb21e5495c177342b5afa6959b4fc9dce30b7b1
3
+ size 487051080
indices.csc.index.npy CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:6d48287a966b6551fed4ef1d41417983e1823694d66d91331c2e1b37044e28e0
3
- size 503228
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:18c9814f2229649fe451e31dfa65bfd0da9f133aada1ca8eb3d2412515960320
3
+ size 487051080
indptr.csc.index.npy CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:27c670565b72d40a0bf486723e6b18b5634cbb58d944d0f5b1d464839a1b59c0
3
- size 108152
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:559927bb45a9f0ad1e629ee3f254c013c8c6d4db46ed460aae9e109168e0b30f
3
+ size 3767948
params.index.json CHANGED
@@ -6,6 +6,6 @@
6
  "idf_method": "lucene",
7
  "dtype": "float32",
8
  "int_dtype": "int32",
9
- "num_docs": 100,
10
  "version": "0.1.10"
11
  }
 
6
  "idf_method": "lucene",
7
  "dtype": "float32",
8
  "int_dtype": "int32",
9
+ "num_docs": 1087947,
10
  "version": "0.1.10"
11
  }
vocab.index.json CHANGED
The diff for this file is too large to render. See raw diff