Update BM25S model
Browse files
- README.md +3 -3
- corpus.jsonl +2 -2
- corpus.mmindex.json +0 -0
- data.csc.index.npy +2 -2
- indices.csc.index.npy +2 -2
- indptr.csc.index.npy +2 -2
- params.index.json +1 -1
- vocab.index.json +2 -2
README.md
CHANGED
@@ -123,9 +123,9 @@ This dataset was created using the following data:
|
|
123 |
|
124 |
| Statistic | Value |
|
125 |
| --- | --- |
|
126 |
-
| Number of documents |
|
127 |
-
| Number of tokens |
|
128 |
-
| Average tokens per document | 8.
|
129 |
|
130 |
## Parameters
|
131 |
|
|
|
123 |
|
124 |
| Statistic | Value |
|
125 |
| --- | --- |
|
126 |
+
| Number of documents | 362841 |
|
127 |
+
| Number of tokens | 2975453 |
|
128 |
+
| Average tokens per document | 8.2 |
|
129 |
|
130 |
## Parameters
|
131 |
|
corpus.jsonl
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
-
size
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:9f53137b4941dda5acc77bc9aaf71e87674bfdd8c0e210f7da39835929823189
|
3 |
+
size 31663181
|
corpus.mmindex.json
CHANGED
The diff for this file is too large to render.
See raw diff
|
|
data.csc.index.npy
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
-
size
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:b2f9838d0102b28876970161fa72ef842c60e8745dd855a336d95f4c5cab5694
|
3 |
+
size 11901940
|
indices.csc.index.npy
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
-
size
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f8f216e8ad4aa8d8a5842155212809db8f6271b634722a72b23493087b2d8f12
|
3 |
+
size 11901940
|
indptr.csc.index.npy
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
-
size
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:241b5484c5bb54f67b0b0d04b3e6d3d09a669c44c57f0ca6ed03ea630abcb43d
|
3 |
+
size 577168
|
params.index.json
CHANGED
@@ -6,7 +6,7 @@
|
|
6 |
"idf_method": "lucene",
|
7 |
"dtype": "float32",
|
8 |
"int_dtype": "int32",
|
9 |
-
"num_docs":
|
10 |
"version": "0.2.6",
|
11 |
"backend": "numpy"
|
12 |
}
|
|
|
6 |
"idf_method": "lucene",
|
7 |
"dtype": "float32",
|
8 |
"int_dtype": "int32",
|
9 |
+
"num_docs": 362841,
|
10 |
"version": "0.2.6",
|
11 |
"backend": "numpy"
|
12 |
}
|
vocab.index.json
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
-
size
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:b1d934afdf72d46521d9543421eda21214c8dcbf975c20f20841c0e63e13ce8e
|
3 |
+
size 2437143
|