Push model using huggingface_hub.
Browse files
- README.md +10 -11
- config.json +1 -1
- config_setfit.json +2 -2
- model.safetensors +1 -1
- model_head.pkl +1 -1
README.md
CHANGED
@@ -189,7 +189,7 @@ model-index:
|
|
189 |
split: test
|
190 |
metrics:
|
191 |
- type: accuracy
|
192 |
-
value: 0.
|
193 |
name: Accuracy
|
194 |
---
|
195 |
|
@@ -272,7 +272,7 @@ The model has been trained using an efficient few-shot learning technique that i
|
|
272 |
### Metrics
|
273 |
| Label | Accuracy |
|
274 |
|:--------|:---------|
|
275 |
-
| **all** | 0.
|
276 |
|
277 |
## Uses
|
278 |
|
@@ -373,8 +373,8 @@ preds = model("##rch procedure that evaluates the objective function p x display
|
|
373 |
| 42 | 10 |
|
374 |
|
375 |
### Training Hyperparameters
|
376 |
-
- batch_size: (
|
377 |
-
- num_epochs: (
|
378 |
- max_steps: -1
|
379 |
- sampling_strategy: oversampling
|
380 |
- num_iterations: 10
|
@@ -383,7 +383,7 @@ preds = model("##rch procedure that evaluates the objective function p x display
|
|
383 |
- loss: CosineSimilarityLoss
|
384 |
- distance_metric: cosine_distance
|
385 |
- margin: 0.25
|
386 |
-
- end_to_end:
|
387 |
- use_amp: False
|
388 |
- warmup_proportion: 0.1
|
389 |
- max_length: 512
|
@@ -392,13 +392,12 @@ preds = model("##rch procedure that evaluates the objective function p x display
|
|
392 |
- load_best_model_at_end: True
|
393 |
|
394 |
### Training Results
|
395 |
-
| Epoch
|
396 |
-
|
397 |
-
| 0.
|
398 |
-
| 0.
|
399 |
-
|
|
400 |
|
401 |
-
* The bold row denotes the saved checkpoint.
|
402 |
### Framework Versions
|
403 |
- Python: 3.10.12
|
404 |
- SetFit: 1.0.3
|
|
|
189 |
split: test
|
190 |
metrics:
|
191 |
- type: accuracy
|
192 |
+
value: 0.009170806266717615
|
193 |
name: Accuracy
|
194 |
---
|
195 |
|
|
|
272 |
### Metrics
|
273 |
| Label | Accuracy |
|
274 |
|:--------|:---------|
|
275 |
+
| **all** | 0.0092 |
|
276 |
|
277 |
## Uses
|
278 |
|
|
|
373 |
| 42 | 10 |
|
374 |
|
375 |
### Training Hyperparameters
|
376 |
+
- batch_size: (16, 16)
|
377 |
+
- num_epochs: (2, 2)
|
378 |
- max_steps: -1
|
379 |
- sampling_strategy: oversampling
|
380 |
- num_iterations: 10
|
|
|
383 |
- loss: CosineSimilarityLoss
|
384 |
- distance_metric: cosine_distance
|
385 |
- margin: 0.25
|
386 |
+
- end_to_end: True
|
387 |
- use_amp: False
|
388 |
- warmup_proportion: 0.1
|
389 |
- max_length: 512
|
|
|
392 |
- load_best_model_at_end: True
|
393 |
|
394 |
### Training Results
|
395 |
+
| Epoch | Step | Training Loss | Validation Loss |
|
396 |
+
|:------:|:----:|:-------------:|:---------------:|
|
397 |
+
| 0.0019 | 1 | 0.2819 | - |
|
398 |
+
| 0.9294 | 500 | 0.0065 | - |
|
399 |
+
| 1.8587 | 1000 | 0.0049 | - |
|
400 |
|
|
|
401 |
### Framework Versions
|
402 |
- Python: 3.10.12
|
403 |
- SetFit: 1.0.3
|
config.json
CHANGED
@@ -1,5 +1,5 @@
|
|
1 |
{
|
2 |
-
"_name_or_path": "/
|
3 |
"architectures": [
|
4 |
"MPNetModel"
|
5 |
],
|
|
|
1 |
{
|
2 |
+
"_name_or_path": "sentence-transformers/multi-qa-mpnet-base-cos-v1",
|
3 |
"architectures": [
|
4 |
"MPNetModel"
|
5 |
],
|
config_setfit.json
CHANGED
@@ -1,4 +1,4 @@
|
|
1 |
{
|
2 |
-
"
|
3 |
-
"
|
4 |
}
|
|
|
1 |
{
|
2 |
+
"normalize_embeddings": false,
|
3 |
+
"labels": null
|
4 |
}
|
model.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 437967672
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:eec439124102164c3c1a5bbc6de59fe41985f69e76b329dff470ac7ca4f1828b
|
3 |
size 437967672
|
model_head.pkl
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 133831
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c6bf911016819125cb55ddf71d5dd24d0e86ded4047eb0cef0fd7fc460ee7d2a
|
3 |
size 133831
|