v0.22 - 2025-04-02 01:24:14 UTC - retrain-pipelines v0.1.1 - Upload model and tokenizer with README.
Browse files
- README.md +97 -31
- adapter_config.json +2 -2
- adapter_model.safetensors +1 -1
- runs/cpt/{events.out.tfevents.1741969186.2d70a17da09c.4767.0 → events.out.tfevents.1743531404.6cdc632317b8.7103.0} +2 -2
- runs/sft/{events.out.tfevents.1741970569.2d70a17da09c.11273.0 → events.out.tfevents.1743532821.6cdc632317b8.13713.0} +2 -2
README.md
CHANGED
@@ -3,9 +3,9 @@
|
|
3 |
# @see https://huggingface.co/docs/huggingface_hub/guides/model-cards#update-metadata
|
4 |
# @see https://huggingface.co/docs/hub/model-cards#model-card-metadata
|
5 |
|
6 |
-
version: '0.
|
7 |
|
8 |
-
timestamp: '
|
9 |
|
10 |
model_name: retrain-pipelines Function Caller
|
11 |
|
@@ -49,7 +49,7 @@ widget:
|
|
49 |
output:
|
50 |
text: '[{"name": "is_perfect_square", "arguments": {"num": 49}}]'
|
51 |
|
52 |
-
mf_run_id: '
|
53 |
|
54 |
# @see https://huggingface.co/docs/huggingface_hub/guides/model-cards#include-evaluation-results
|
55 |
# @see https://huggingface.co/docs/huggingface_hub/main/en/package_reference/cards#huggingface_hub.EvalResult
|
@@ -63,52 +63,118 @@ model-index:
|
|
63 |
name: retrain-pipelines Function Calling
|
64 |
type: retrain-pipelines/func_calls_ds
|
65 |
split: validation
|
66 |
-
revision:
|
67 |
metrics:
|
68 |
- type: precision
|
69 |
-
value: 0.
|
70 |
- type: recall
|
71 |
-
value: 0.
|
72 |
- type: f1
|
73 |
-
value: 0.
|
74 |
- type: jaccard
|
75 |
-
value: 0.
|
76 |
|
77 |
---
|
78 |
|
79 |
-
|
80 |
-
|
81 |
-
|
82 |
-
|
83 |
-
|
84 |
-
|
85 |
-
|
86 |
-
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
87 |
|
88 |
Training dataset :
|
89 |
-
- <code>retrain-pipelines/func_calls_ds v0.
|
90 |
-
(<a href="https://huggingface.co/datasets/retrain-pipelines/func_calls_ds/blob/
|
91 |
-
target="_blank">
|
92 |
-
2025-
|
|
|
|
|
93 |
|
94 |
Base model :
|
95 |
- <code>unsloth/Qwen2.5-1.5B</code>
|
96 |
(<a href="https://huggingface.co/unsloth/Qwen2.5-1.5B/blob/2d0a015faee2c1af360a6725a30c4d7a258ac4d4/README.md"
|
97 |
target="_blank">2d0a015</a> -
|
98 |
-
2025-02-06 02:32:14 UTC)
|
|
|
|
|
99 |
arxiv :<br />
|
100 |
- <code><a href="https://huggingface.co/papers/2407.10671"
|
101 |
target="_blank">2407.10671</a></code><br />
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
102 |
<br />
|
103 |
<br />
|
104 |
-
<br />
|
105 |
-
<br />
|
106 |
-
<br />
|
107 |
|
108 |
-
<
|
109 |
-
|
110 |
-
|
111 |
-
|
112 |
-
|
113 |
-
|
114 |
-
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
3 |
# @see https://huggingface.co/docs/huggingface_hub/guides/model-cards#update-metadata
|
4 |
# @see https://huggingface.co/docs/hub/model-cards#model-card-metadata
|
5 |
|
6 |
+
version: '0.22'
|
7 |
|
8 |
+
timestamp: '20250402_012414955_UTC'
|
9 |
|
10 |
model_name: retrain-pipelines Function Caller
|
11 |
|
|
|
49 |
output:
|
50 |
text: '[{"name": "is_perfect_square", "arguments": {"num": 49}}]'
|
51 |
|
52 |
+
mf_run_id: '92'
|
53 |
|
54 |
# @see https://huggingface.co/docs/huggingface_hub/guides/model-cards#include-evaluation-results
|
55 |
# @see https://huggingface.co/docs/huggingface_hub/main/en/package_reference/cards#huggingface_hub.EvalResult
|
|
|
63 |
name: retrain-pipelines Function Calling
|
64 |
type: retrain-pipelines/func_calls_ds
|
65 |
split: validation
|
66 |
+
revision: 8d4dacf6095dc0ef2702d58dfeaa36b730dece00
|
67 |
metrics:
|
68 |
- type: precision
|
69 |
+
value: 0.7514837980270386
|
70 |
- type: recall
|
71 |
+
value: 0.7512756586074829
|
72 |
- type: f1
|
73 |
+
value: 0.7511526346206665
|
74 |
- type: jaccard
|
75 |
+
value: 0.7329407334327698
|
76 |
|
77 |
---
|
78 |
|
79 |
+
<div
|
80 |
+
class="
|
81 |
+
p-6 mb-4 rounded-lg
|
82 |
+
pt-6 sm:pt-9
|
83 |
+
bg-gradient-to-b
|
84 |
+
from-purple-500
|
85 |
+
dark:from-purple-500/20
|
86 |
+
"
|
87 |
+
>
|
88 |
+
<div
|
89 |
+
class="
|
90 |
+
pl-4 rounded-lg
|
91 |
+
border-2 border-gray-100
|
92 |
+
bg-gradient-to-b
|
93 |
+
from-purple-500
|
94 |
+
dark:from-purple-500/20
|
95 |
+
"
|
96 |
+
>
|
97 |
+
<b>retrain-pipelines Function Caller</b>
|
98 |
+
</div>
|
99 |
+
<code>version 0.22</code> - <code>2025-04-02 01:24:14 UTC</code>
|
100 |
+
(retraining
|
101 |
+
<a target="_blank"
|
102 |
+
href="https://huggingface.co/retrain-pipelines/function_caller_lora/tree/retrain-pipelines_source-code/v0.22_20250402_012414955_UTC">source-code</a> |
|
103 |
+
<a target="_blank"
|
104 |
+
href="https://huggingface.co/spaces/retrain-pipelines/online_pipeline_card_renderer/?model_repo_id=retrain-pipelines/function_caller_lora&version_id=v0.22_20250402_012414955_UTC">pipeline-card</a>)
|
105 |
+
</div>
|
106 |
|
107 |
Training dataset :
|
108 |
+
- <code>retrain-pipelines/func_calls_ds v0.20</code>
|
109 |
+
(<a href="https://huggingface.co/datasets/retrain-pipelines/func_calls_ds/blob/8d4dacf6095dc0ef2702d58dfeaa36b730dece00/README.md"
|
110 |
+
target="_blank">8d4dacf</a> -
|
111 |
+
2025-04-01 18:12:25 UTC)
|
112 |
+
<br />
|
113 |
+
<img alt="" src="https://img.shields.io/badge/dynamic/json?url=https%3A%2F%2Fhuggingface.co%2Fapi%2Fdatasets%2Fretrain-pipelines/func_calls_ds&query=%24.downloads&logo=huggingface&label=downloads" class="inline-block" /> <img alt="" src="https://img.shields.io/badge/dynamic/json?url=https%3A%2F%2Fhuggingface.co%2Fapi%2Fdatasets%2Fretrain-pipelines/func_calls_ds&query=%24.likes&logo=huggingface&label=likes" class="inline-block" />
|
114 |
|
115 |
Base model :
|
116 |
- <code>unsloth/Qwen2.5-1.5B</code>
|
117 |
(<a href="https://huggingface.co/unsloth/Qwen2.5-1.5B/blob/2d0a015faee2c1af360a6725a30c4d7a258ac4d4/README.md"
|
118 |
target="_blank">2d0a015</a> -
|
119 |
+
2025-02-06 02:32:14 UTC)
|
120 |
+
<br />
|
121 |
+
<img alt="" src="https://img.shields.io/badge/dynamic/json?url=https%3A%2F%2Fhuggingface.co%2Fapi%2Fmodels%2Funsloth/Qwen2.5-1.5B&query=%24.downloads&logo=huggingface&label=downloads" class="inline-block" /> <img alt="" src="https://img.shields.io/badge/dynamic/json?url=https%3A%2F%2Fhuggingface.co%2Fapi%2Fmodels%2Funsloth/Qwen2.5-1.5B&query=%24.likes&logo=huggingface&label=likes" class="inline-block" /><br />
|
122 |
arxiv :<br />
|
123 |
- <code><a href="https://huggingface.co/papers/2407.10671"
|
124 |
target="_blank">2407.10671</a></code><br />
|
125 |
+
This LoRA adapter can, for instance, be used as follows :<br />
|
126 |
+
```python
|
127 |
+
from transformers import AutoModelForCausalLM, AutoTokenizer
|
128 |
+
from torch import device, cuda
|
129 |
+
|
130 |
+
repo_id = "retrain-pipelines/function_caller_lora"
|
131 |
+
revision = "<model_revision_commit_hash>"
|
132 |
+
model = AutoModelForCausalLM.from_pretrained(
|
133 |
+
repo_id, revision=revision, torch_dtype="auto", device_map="auto")
|
134 |
+
tokenizer = AutoTokenizer.from_pretrained(
|
135 |
+
repo_id, revision=revision, torch_dtype="auto", device_map="auto")
|
136 |
+
|
137 |
+
device = device("cuda" if cuda.is_available() else "cpu")
|
138 |
+
def generate_tool_calls_list(query, max_new_tokens=400) -> str:
|
139 |
+
formatted_query = tokenizer.chat_template.format(query, "")
|
140 |
+
inputs = tokenizer(formatted_query, return_tensors="pt").input_ids.to(device)
|
141 |
+
outputs = model.generate(inputs, max_new_tokens=max_new_tokens, do_sample=False)
|
142 |
+
generated_text = tokenizer.batch_decode(outputs, skip_special_tokens=True)[0]
|
143 |
+
return generated_text[len(formatted_query):].strip()
|
144 |
+
|
145 |
+
generate_tool_calls_list("Is 49 a perfect square ?")
|
146 |
+
```
|
147 |
+
|
148 |
<br />
|
149 |
<br />
|
|
|
|
|
|
|
150 |
|
151 |
+
<div
|
152 |
+
class="
|
153 |
+
p-6 mb-4 rounded-lg
|
154 |
+
pt-6 sm:pt-9
|
155 |
+
px-4
|
156 |
+
pb-1
|
157 |
+
bg-gradient-to-t
|
158 |
+
from-purple-500
|
159 |
+
dark:from-purple-500/20
|
160 |
+
"
|
161 |
+
>
|
162 |
+
<div
|
163 |
+
class="
|
164 |
+
p-6 mb-4 rounded-lg
|
165 |
+
border-2 border-gray-100
|
166 |
+
pt-6 sm:pt-9
|
167 |
+
bg-gradient-to-t
|
168 |
+
from-purple-500
|
169 |
+
dark:from-purple-500/20
|
170 |
+
"
|
171 |
+
>
|
172 |
+
Powered by
|
173 |
+
<code><a target="_blank"
|
174 |
+
href="https://github.com/aurelienmorgan/retrain-pipelines">retrain-pipelines
|
175 |
+
0.1.1</a></code> -
|
176 |
+
<code>Run by <a target="_blank" href="https://huggingface.co/Aurelien-Morgan-Bot">Aurelien-Morgan-Bot</a></code> -
|
177 |
+
<em><b>UnslothFuncCallFlow</b></em> - mf_run_id : <code>92</code>
|
178 |
+
</div>
|
179 |
+
</div>
|
180 |
+
|
adapter_config.json
CHANGED
@@ -26,12 +26,12 @@
|
|
26 |
"rank_pattern": {},
|
27 |
"revision": null,
|
28 |
"target_modules": [
|
|
|
29 |
"up_proj",
|
30 |
"v_proj",
|
31 |
-
"gate_proj",
|
32 |
"q_proj",
|
33 |
-
"down_proj",
|
34 |
"k_proj",
|
|
|
35 |
"o_proj"
|
36 |
],
|
37 |
"task_type": "CAUSAL_LM",
|
|
|
26 |
"rank_pattern": {},
|
27 |
"revision": null,
|
28 |
"target_modules": [
|
29 |
+
"gate_proj",
|
30 |
"up_proj",
|
31 |
"v_proj",
|
|
|
32 |
"q_proj",
|
|
|
33 |
"k_proj",
|
34 |
+
"down_proj",
|
35 |
"o_proj"
|
36 |
],
|
37 |
"task_type": "CAUSAL_LM",
|
adapter_model.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 2457916480
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:cae66f633a344d4997113e2850297009196be57c880d99b5591b0e33627b330f
|
3 |
size 2457916480
|
runs/cpt/{events.out.tfevents.1741969186.2d70a17da09c.4767.0 → events.out.tfevents.1743531404.6cdc632317b8.7103.0}
RENAMED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
-
size
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0b0dc87504b3ed4546e908c26d5ea48a471d2c37ba1a4c65956229563c25c2d2
|
3 |
+
size 61059
|
runs/sft/{events.out.tfevents.1741970569.2d70a17da09c.11273.0 → events.out.tfevents.1743532821.6cdc632317b8.13713.0}
RENAMED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
-
size
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:22fa8e22b31dded99b6c8932d162b1dd82f2f92c953b9284946c64c66e759158
|
3 |
+
size 1007718
|