Add SetFit model
Browse files
- README.md +26 -20
- config_sentence_transformers.json +2 -2
- config_setfit.json +2 -2
- model.safetensors +1 -1
- model_head.pkl +1 -1
README.md
CHANGED
@@ -74,7 +74,7 @@ model-index:
|
|
74 |
split: test
|
75 |
metrics:
|
76 |
- type: accuracy
|
77 |
-
value: 0.
|
78 |
name: Accuracy
|
79 |
---
|
80 |
|
@@ -106,17 +106,17 @@ The model has been trained using an efficient few-shot learning technique that i
|
|
106 |
- **Blogpost:** [SetFit: Efficient Few-Shot Learning Without Prompts](https://huggingface.co/blog/setfit)
|
107 |
|
108 |
### Model Labels
|
109 |
-
| Label | Examples
|
110 |
-
|
111 |
-
|
|
112 |
-
|
|
113 |
|
114 |
## Evaluation
|
115 |
|
116 |
### Metrics
|
117 |
| Label | Accuracy |
|
118 |
|:--------|:---------|
|
119 |
-
| **all** | 0.
|
120 |
|
121 |
## Uses
|
122 |
|
@@ -171,16 +171,16 @@ Final evaluation:")
|
|
171 |
### Training Set Metrics
|
172 |
| Training set | Min | Median | Max |
|
173 |
|:-------------|:----|:--------|:----|
|
174 |
-
| Word count |
|
175 |
|
176 |
| Label | Training Sample Count |
|
177 |
|:------|:----------------------|
|
178 |
-
| 0 |
|
179 |
-
| 1 |
|
180 |
|
181 |
### Training Hyperparameters
|
182 |
- batch_size: (16, 16)
|
183 |
-
- num_epochs: (
|
184 |
- max_steps: -1
|
185 |
- sampling_strategy: oversampling
|
186 |
- num_iterations: 20
|
@@ -200,21 +200,27 @@ Final evaluation:")
|
|
200 |
### Training Results
|
201 |
| Epoch | Step | Training Loss | Validation Loss |
|
202 |
|:------:|:----:|:-------------:|:---------------:|
|
203 |
-
| 0.
|
204 |
-
| 0.
|
205 |
-
| 0.
|
206 |
-
| 0.
|
207 |
-
|
|
208 |
-
|
|
209 |
-
|
|
|
|
|
|
|
|
|
|
|
|
|
|
210 |
|
211 |
### Framework Versions
|
212 |
- Python: 3.10.14
|
213 |
- SetFit: 1.1.0
|
214 |
-
- Sentence Transformers: 3.1.
|
215 |
- Transformers: 4.44.0
|
216 |
-
- PyTorch: 2.4.
|
217 |
-
- Datasets:
|
218 |
- Tokenizers: 0.19.1
|
219 |
|
220 |
## Citation
|
|
|
74 |
split: test
|
75 |
metrics:
|
76 |
- type: accuracy
|
77 |
+
value: 0.7611940298507462
|
78 |
name: Accuracy
|
79 |
---
|
80 |
|
|
|
106 |
- **Blogpost:** [SetFit: Efficient Few-Shot Learning Without Prompts](https://huggingface.co/blog/setfit)
|
107 |
|
108 |
### Model Labels
|
109 |
+
| Label | Examples |
|
110 |
+
|:------|:----------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------|
|
111 |
+
| 1 | <ul><li>'Reasoning:\nhallucination - The answer introduces information that is not found in the document, which indicates that it is hallucinating.\nEvaluation:'</li><li>'Reasoning:\nThe answer provided is mostly aligned with the content of the document, discussing pulse checking as a rough method to estimate if systolic blood pressure is relatively normal. However, the mention of checking after moderate activity seems slightly misrepresented compared to the source material. The source also provides minor additional context and disclaimers that the answer partially addresses.\n\nFinal Evaluation:'</li><li>"Reasoning:\n- Well-Supported: The answer correctly explains the flexibility in holidays, including the 4-6 weeks off, the requirement for a 2-week consecutive break, and the need for clear communication, which stems from the documents.\n- Specificity: The answer provides specific details about the holiday policy at ORGANIZATION, reflecting what's stated in the document.\n- Conciseness: The answer is clear and to the point, covering all the necessary aspects of the flexible holiday policy without unnecessary details.\n\nEvaluation:"</li></ul> |
|
112 |
+
| 0 | <ul><li>'Reasoning:\nirrelevant - The answer provided does not relate to the document or the specific question asked.\nEvaluation:'</li><li>'Reasoning:\nThe given answer sufficiently explains the referral bonus structure, including specific amounts for typical and difficult-to-fill roles, eligibility criteria, and the referral process. It also mentions that certain roles (e.g., hiring managers) are excluded from receiving bonuses.\n\nEvaluation:'</li><li>"Reasoning:\ncontext grounding - The answer is well-supported by the document, although some specific points, such as drinking ice water, weren't explicitly mentioned.\nrelevance - The answer is directly related to the specific question asked.\nconciseness - While the answer is quite detailed, it remains focused and does not deviate into unrelated topics, making it concise enough given the context.\n\nEvaluation:"</li></ul> |
|
113 |
|
114 |
## Evaluation
|
115 |
|
116 |
### Metrics
|
117 |
| Label | Accuracy |
|
118 |
|:--------|:---------|
|
119 |
+
| **all** | 0.7612 |
|
120 |
|
121 |
## Uses
|
122 |
|
|
|
171 |
### Training Set Metrics
|
172 |
| Training set | Min | Median | Max |
|
173 |
|:-------------|:----|:--------|:----|
|
174 |
+
| Word count | 3 | 38.1107 | 148 |
|
175 |
|
176 |
| Label | Training Sample Count |
|
177 |
|:------|:----------------------|
|
178 |
+
| 0 | 111 |
|
179 |
+
| 1 | 133 |
|
180 |
|
181 |
### Training Hyperparameters
|
182 |
- batch_size: (16, 16)
|
183 |
+
- num_epochs: (1, 1)
|
184 |
- max_steps: -1
|
185 |
- sampling_strategy: oversampling
|
186 |
- num_iterations: 20
|
|
|
200 |
### Training Results
|
201 |
| Epoch | Step | Training Loss | Validation Loss |
|
202 |
|:------:|:----:|:-------------:|:---------------:|
|
203 |
+
| 0.0016 | 1 | 0.2275 | - |
|
204 |
+
| 0.0820 | 50 | 0.2535 | - |
|
205 |
+
| 0.1639 | 100 | 0.2094 | - |
|
206 |
+
| 0.2459 | 150 | 0.1707 | - |
|
207 |
+
| 0.3279 | 200 | 0.1085 | - |
|
208 |
+
| 0.4098 | 250 | 0.0439 | - |
|
209 |
+
| 0.4918 | 300 | 0.0268 | - |
|
210 |
+
| 0.5738 | 350 | 0.0129 | - |
|
211 |
+
| 0.6557 | 400 | 0.0256 | - |
|
212 |
+
| 0.7377 | 450 | 0.016 | - |
|
213 |
+
| 0.8197 | 500 | 0.0128 | - |
|
214 |
+
| 0.9016 | 550 | 0.0109 | - |
|
215 |
+
| 0.9836 | 600 | 0.0127 | - |
|
216 |
|
217 |
### Framework Versions
|
218 |
- Python: 3.10.14
|
219 |
- SetFit: 1.1.0
|
220 |
+
- Sentence Transformers: 3.1.1
|
221 |
- Transformers: 4.44.0
|
222 |
+
- PyTorch: 2.4.0+cu121
|
223 |
+
- Datasets: 3.0.0
|
224 |
- Tokenizers: 0.19.1
|
225 |
|
226 |
## Citation
|
config_sentence_transformers.json
CHANGED
@@ -1,8 +1,8 @@
|
|
1 |
{
|
2 |
"__version__": {
|
3 |
-
"sentence_transformers": "3.1.
|
4 |
"transformers": "4.44.0",
|
5 |
-
"pytorch": "2.4.
|
6 |
},
|
7 |
"prompts": {},
|
8 |
"default_prompt_name": null,
|
|
|
1 |
{
|
2 |
"__version__": {
|
3 |
+
"sentence_transformers": "3.1.1",
|
4 |
"transformers": "4.44.0",
|
5 |
+
"pytorch": "2.4.0+cu121"
|
6 |
},
|
7 |
"prompts": {},
|
8 |
"default_prompt_name": null,
|
config_setfit.json
CHANGED
@@ -1,4 +1,4 @@
|
|
1 |
{
|
2 |
-
"
|
3 |
-
"
|
4 |
}
|
|
|
1 |
{
|
2 |
+
"labels": null,
|
3 |
+
"normalize_embeddings": false
|
4 |
}
|
model.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 437951328
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c49a7a24588072d2710874c643a2db5e20fdce42c20e85928f35589a53668978
|
3 |
size 437951328
|
model_head.pkl
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 7007
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c0c6ddbbda48b1288974be33614b39ef266863f4addbc5cc33f2ab0a8f788b20
|
3 |
size 7007
|