carlesoctav
committed on
Add SetFit model
Browse files- 1_Pooling/config.json +10 -0
- README.md +316 -0
- config.json +24 -0
- config_sentence_transformers.json +9 -0
- config_setfit.json +7 -0
- model.safetensors +3 -0
- model_head.pkl +3 -0
- modules.json +14 -0
- sentence_bert_config.json +4 -0
- special_tokens_map.json +51 -0
- tokenizer.json +0 -0
- tokenizer_config.json +66 -0
- vocab.txt +0 -0
1_Pooling/config.json
ADDED
@@ -0,0 +1,10 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"word_embedding_dimension": 768,
|
3 |
+
"pooling_mode_cls_token": false,
|
4 |
+
"pooling_mode_mean_tokens": true,
|
5 |
+
"pooling_mode_max_tokens": false,
|
6 |
+
"pooling_mode_mean_sqrt_len_tokens": false,
|
7 |
+
"pooling_mode_weightedmean_tokens": false,
|
8 |
+
"pooling_mode_lasttoken": false,
|
9 |
+
"include_prompt": true
|
10 |
+
}
|
README.md
ADDED
@@ -0,0 +1,316 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
---
|
2 |
+
language: en
|
3 |
+
license: apache-2.0
|
4 |
+
library_name: setfit
|
5 |
+
tags:
|
6 |
+
- setfit
|
7 |
+
- sentence-transformers
|
8 |
+
- text-classification
|
9 |
+
- generated_from_setfit_trainer
|
10 |
+
metrics:
|
11 |
+
- accuracy
|
12 |
+
- precision
|
13 |
+
- recall
|
14 |
+
- f1
|
15 |
+
widget:
|
16 |
+
- text: not so jolly dolly so, last weekend my wife and i watched the oppen part of
|
17 |
+
the "barbenheimer" 2023 box-office two-headed monster and this week it was barbie's
|
18 |
+
turn. from the little i'd incidentally read in advance about the day-glo billion
|
19 |
+
dollar blockbuster, i was expecting some kind of retro-cool, existentialist, post-modernist
|
20 |
+
satire on the battle of the sexes, consumerism and childhood buffed up with a
|
21 |
+
little diversity along the way, but somehow with all these ducks lined up in a
|
22 |
+
row, i felt the film missed the mark.it starts brightly with eye-candy sets in
|
23 |
+
fifty shades of pink as we're introduced to margot robbie's barbie in her barbie-world
|
24 |
+
of alternative barbies, see through doll's houses and their various incomplete
|
25 |
+
consumer goods, for example our girl has her daily dry-shower and drinks non-existent
|
26 |
+
tea. everything appears to be perfect in her / their perfect world, unless you're
|
27 |
+
the boyfriend ken, here also in a variety of forms, all doomed to exist only in
|
28 |
+
barbie's slipstream and so experience recurring frustration at getting precisely
|
29 |
+
nowhere, all the time, with the object of his / their, i hesitate to call it,
|
30 |
+
desire.then things start to go wrong for robbie's "stereotypical" barbie. she
|
31 |
+
thinks of death and starts to malfunction and after a visit to kate mckinnon's
|
32 |
+
weird barbie, a concept i have to say i didn't get at all, she determines to go
|
33 |
+
to the real world to connect with the disillusioned mattel employee, played by
|
34 |
+
america ferrera, whose negativity, channelled through her disinterested daughter
|
35 |
+
ariana greenblatt, is upsetting the living doll's equilibrium. ryan gosling's
|
36 |
+
wheedling ken is also along for the ride and stows away in her penelope pitstop-mobile
|
37 |
+
and together they head for l. a., where ferrera lives, the headquarters of the
|
38 |
+
manufacturer mattel.for me, the film went downhill fast from there with ken's
|
39 |
+
head getting messed-up with perceptions of patriarchy while barbie has a meltdown
|
40 |
+
over her identity-crisis. there are unfunny, over-played scenes where barbie experiences
|
41 |
+
humiliation at the hands of greenblatt and her school chums, traipses down to
|
42 |
+
mattel hq to confront the all-male board of directors headed by a mis-cast will
|
43 |
+
ferrell as the company ceo, before returning to barbie-world with ferrera and
|
44 |
+
greenblatt in tow to take down ken's new-model kendom where outdated male-superiority
|
45 |
+
is literally back in the saddle.i have to admit, i got very bored, very soon with
|
46 |
+
this empty, supposedly satirical high-concept, fantasy-comedy. a world box-office
|
47 |
+
of 1.5 billion dollars and eight oscar nominations actually makes me wonder if
|
48 |
+
i've not switched places too with barbie-world as i'm afraid nothing about the
|
49 |
+
movie, including the soundtrack and unsuccessful attempts at either comedy or
|
50 |
+
pathos (especially when they wheel in rhea perlman as the doll's now-enlightened
|
51 |
+
creator) all missing me by miles.when at one point, all her namesakes shout "go
|
52 |
+
barbie!', i must admit i was with them 100% but for completely different reasons.
|
53 |
+
- text: way better than expected i was amongst the people who thought they saw a majority
|
54 |
+
of this film based on all of the filming stills posted on the bird app in 2022.
|
55 |
+
i still wanted to see it. something about their perfect neon rollerblading outfits.
|
56 |
+
i saw one preview and wasn't sure what the plot was going to be, i didn't care,
|
57 |
+
i still wanted to see it. i wasn't expecting it to be amazing, but amazing it
|
58 |
+
was. well done!! margot really knocked it out of the dollhouse. ryan i'll never
|
59 |
+
look at the same way way again. this 1980s barbie superman is very pleased. it
|
60 |
+
won't be long until the opening dance scene is all over the clock app. i haven't
|
61 |
+
felt so compelled to learn choreography since michael jackson's thriller. also,
|
62 |
+
girls rule. sorry, ken. 12 out of 24 found this helpful. was this review helpful?
|
63 |
+
sign in to vote. permalink
|
64 |
+
- text: 'anyone remember the film "life size"? from a far, i can see why people would
|
65 |
+
absolutely hate this movie. just the concept of "barbie: the movie" is enough
|
66 |
+
to make people feel like the art of cinema has been compromised by corporate america.
|
67 |
+
but, as a whole, this movie was very well received. it made over a billion dollars
|
68 |
+
at the box-office and was nominated for 8 oscars including "best picture", so
|
69 |
+
clearly it some people really liked it.there is a lot to enjoy in this film. the
|
70 |
+
movie does a good job with poking fun at the barbie brand without it feeling too
|
71 |
+
much like a spoof. this is a comedy, so the fact that the film is really funny
|
72 |
+
is kind of an important element. understandably comedy is a subjective thing,
|
73 |
+
so all i can say is for me, i laughed out loud several times through the movie.
|
74 |
+
the movie is clever in how it treats its "worldbuilding" and nicely avoids any
|
75 |
+
firm answers about how this world works. because, yeah, if you think about that
|
76 |
+
sort of stuff in the film there is a lot that doesn''t add up.it is nice that
|
77 |
+
they don''t spend too much time in "the real world" and focus on the creative
|
78 |
+
fun of "barbie world". the movie is more visually unique and can do more gags
|
79 |
+
when that is the case.when the movie is focusing on being a bizarre comedy, that
|
80 |
+
is when some of the best and most memorable things happen. when it tries to have
|
81 |
+
a more serious message, that is where it loses some momentum. don''t misunderstand
|
82 |
+
me, the movie needs some serious stuff in order to make the comedy work. and the
|
83 |
+
stuff with ugly betty and her daughter is good emotional stuff. but towards the
|
84 |
+
end, they realize that barbie needs to have a character arc and feel like they
|
85 |
+
tack one on last second. there are some very funny jokes towards the end, but
|
86 |
+
it does become a little repetitive and the message feels heavy handed by the 5th
|
87 |
+
time it''s brought up. side note: i wanted a cameo from the voice actress of barbie,
|
88 |
+
kelly sheridan, but she wasn''t there.i will emphasize this because hollywood
|
89 |
+
will learn all the wrong lessons from this movie''s success. we do not want a
|
90 |
+
"polly pocket" movie or an "uno" movie. what made this film a success, beyond
|
91 |
+
its brand or its marketing campaign, is that it was uniquely greta gerwig''s vision.
|
92 |
+
the movie wasn''t concerned with mass audience appeal, it would tell jokes that
|
93 |
+
they thought were funny and hoped others would enjoy as well. if you want to duplicate
|
94 |
+
barbie''s success, give creative people control to make some out there stuff.wrapped
|
95 |
+
in plastic, it''s fantastic.'
|
96 |
+
- text: great expectations this film exceeded all of my expectations a n d i was looking
|
97 |
+
forward to seeing it. i wonder about any parents who might bring their children
|
98 |
+
to see it expecting something quite different from what this film is. one hour
|
99 |
+
fifty four minutes of fun from beginning to end. satire, sarcasm , humor at every
|
100 |
+
turn. production values and acting off the charts good. i can't believe mattel
|
101 |
+
let them make the movie with complete artistic freedom. think of nicole kidman
|
102 |
+
in the amc promo before a movie starts and says, " somehow heartbreak feels good
|
103 |
+
in a place like this ". well somehow watching a silly spoof like this movie feels
|
104 |
+
great all the way through and even afterwards. i loved it and i am not surprised
|
105 |
+
at the huge box office , this movie rocks. 4 out of 11 found this helpful. was
|
106 |
+
this review helpful? sign in to vote. permalink
|
107 |
+
- text: decent i like what they did with this movie and the characters with its combining
|
108 |
+
the barbie world and the real world. barbie starts getting "vibes" and has to
|
109 |
+
go into the real world to find the girl who played with her to set things right
|
110 |
+
and winds up in the mattel headquarters. something resembling chaos ensues. ken
|
111 |
+
joins her and winds up causing further damage. i like what they do in various
|
112 |
+
stages of the story and with the characters. it was overall a very pleasant surprise
|
113 |
+
snd a good movie with a good cast. margot robbie, ryan gosling, america ferrera,
|
114 |
+
and will ferrell were all good in their roles. if you are a movie and/or a barbie
|
115 |
+
fan, you will love this movie.*** out of **** 2 out of 7 found this helpful. was
|
116 |
+
this review helpful? sign in to vote. permalink
|
117 |
+
pipeline_tag: text-classification
|
118 |
+
inference: true
|
119 |
+
model-index:
|
120 |
+
- name: SetFit
|
121 |
+
results:
|
122 |
+
- task:
|
123 |
+
type: text-classification
|
124 |
+
name: Text Classification
|
125 |
+
dataset:
|
126 |
+
name: data/raw/barbie.jsonl
|
127 |
+
type: unknown
|
128 |
+
split: test
|
129 |
+
metrics:
|
130 |
+
- type: accuracy
|
131 |
+
value: 0.8811688311688312
|
132 |
+
name: Accuracy
|
133 |
+
- type: precision
|
134 |
+
value: 0.9952114924181963
|
135 |
+
name: Precision
|
136 |
+
- type: recall
|
137 |
+
value: 0.8757022471910112
|
138 |
+
name: Recall
|
139 |
+
- type: f1
|
140 |
+
value: 0.9316398954053045
|
141 |
+
name: F1
|
142 |
+
---
|
143 |
+
|
144 |
+
# SetFit
|
145 |
+
|
146 |
+
This is a [SetFit](https://github.com/huggingface/setfit) model that can be used for Text Classification. A [LogisticRegression](https://scikit-learn.org/stable/modules/generated/sklearn.linear_model.LogisticRegression.html) instance is used for classification.
|
147 |
+
|
148 |
+
The model has been trained using an efficient few-shot learning technique that involves:
|
149 |
+
|
150 |
+
1. Fine-tuning a [Sentence Transformer](https://www.sbert.net) with contrastive learning.
|
151 |
+
2. Training a classification head with features from the fine-tuned Sentence Transformer.
|
152 |
+
|
153 |
+
## Model Details
|
154 |
+
|
155 |
+
### Model Description
|
156 |
+
- **Model Type:** SetFit
|
157 |
+
<!-- - **Sentence Transformer:** [Unknown](https://huggingface.co/unknown) -->
|
158 |
+
- **Classification head:** a [LogisticRegression](https://scikit-learn.org/stable/modules/generated/sklearn.linear_model.LogisticRegression.html) instance
|
159 |
+
- **Maximum Sequence Length:** 512 tokens
|
160 |
+
- **Number of Classes:** 2 classes
|
161 |
+
<!-- - **Training Dataset:** [Unknown](https://huggingface.co/datasets/unknown) -->
|
162 |
+
- **Language:** en
|
163 |
+
- **License:** apache-2.0
|
164 |
+
|
165 |
+
### Model Sources
|
166 |
+
|
167 |
+
- **Repository:** [SetFit on GitHub](https://github.com/huggingface/setfit)
|
168 |
+
- **Paper:** [Efficient Few-Shot Learning Without Prompts](https://arxiv.org/abs/2209.11055)
|
169 |
+
- **Blogpost:** [SetFit: Efficient Few-Shot Learning Without Prompts](https://huggingface.co/blog/setfit)
|
170 |
+
|
171 |
+
### Model Labels
|
172 |
+
| Label | Examples |
|
173 |
+
|:---------|:---------|
|
174 |
+
| negative | <ul><li>"definitely not for kids i've just taken 2 nieces, 9 and 14, to see barbie. they both hated it... really, really hated it!! and, me: i'm just stunned. i've no idea what i've just seen.if barbie is meant to be a dark satire, it's alright. if it's meant to be a kids movie, it's unconscionably bad. and, i'm totally confused which type of movie it's supposed to be. what the literal heck is going on!!if you're looking for a twenty first century dark cultural satire, you're at least in your twenties, you've an open mind, this is your movie... maybe. if you're looking for a movie to take your kids to, before getting ice cream, this is absolutely not the movie you're looking for. my advice: give barbie a miss and go straight for the ice cream. you will be so much happier. i wish i had. 15 out of 30 found this helpful. was this review helpful? sign in to vote. permalink"</li><li>"the most political movie i've ever seen. i loved the effort with the sets and the fun outfits. i also really enjoyed the ads threw out movie.i was really enjoying this movie but then it started getting really political, i was kind of fine with it but then they started making politics the whole story line and so it was really no longer a fun movie. after the movie finished i just ended up leaving miserable and like i waisted money... how is a family meant to enjoy this?? i can't see any 13 year old understanding anything they talk about.also they want to talk about how being a human is hard and that were not perfect but then they hire someone to play a teen girl who has perfect hair and skin. a bit of a confusing message? 180 out of 276 found this helpful. was this review helpful? sign in to vote. permalink"</li><li>"mediocre at best i had high expectations as a result of the media press, however these we're crushed from the start.first of all, i did expect it to feel a little generic and cheesy although all i could feel throughout the movie is that it was rushed and cheap. 
the storyline was dry and over-political.i'd have liked to see more lgbtq+ representation and breaking stereotypes, as it felt like just a generic film. even the barbies were considered stereotypes!comedy throughout was limited and wasn't engaging at all - sometimes trying too hard to emphasise feminism and going too far in the opposite direction to the world is heading in (i'm not encouraging patriarchy).however, i did find the music quite good (especially the billie eilish song) and did redeem the movie a little bit.in summary, the movie was mediocre at best and there's not much to discuss. it felt like a cheap version of movies like spirited and the greatest showman with no real emotion."</li></ul> |
|
175 |
+
| positive | <ul><li>"fabulously done so, i didn't have that much of a high expectation going in to see this because i really wasn't sure what is was going to be. i grew up playing barbie's and have watched the animated films many times with my kids.the movie from start to finish is so thoughtfully executed. it's for everyone, but mainly young girls need to see this. it's a great reminder of how special we are as women and how special all of us are individually as a person and the life we get to experience.another fantastic element is adding a very 90s feel to the film. you will laugh like you used to laugh when fun comedies would come out in theatre's years ago. i haven't seen just a good comedy with heart in years.i brought my 7yr old and we dressed up for it too. i wanted her to see me comfortable in my own skin and her as well and the film touches on that. it's suited for any age, regardless of the rating.i don't give high ratings like this to films usually, as i find small things usually that i wish had been addressed more... but not in barbie. what a fun movie and a great time you'll have watching this in theatre (or at home) knowing it's your childhood come to life."</li><li>"sure, life in plastic is fantastic but only in barbieland the barbie movie was unexpected. it was a colorful and clever ride in the cinema. i was not expecting all the deep emotions that the film gave. life is not all about perfection, which a lot of people wants to constantly achieve these days, imperfections is what identifies us and that's okay.i'm a visual kind of cinema goer and i have the say that dance sequence (dance the night) and the scene where barbie and ken where traveling to the real world were amazing. kudos to the creative team behind it, i absolutely adore the set.greta gerwig and her team delivered a visual spectacle with a heart. 10 out of 28 found this helpful. was this review helpful? sign in to vote. 
permalink"</li><li>"funny with social commentary barbie (margot robbie) lives in barbieland. ken (ryan gosling) is always desperate for her attention. all the ken and barbie dolls live in a happy matriarchy unaware of the real world. out of the blue, barbie starts pondering death and her existence. weird barbie (kate mckinnon) tells her that she has opened a portal to the real world and must fix whatever is her real world problem before she can return to her perfect self. she and stowaway ken find the real world completely different than their expectations. mattel ceo (will ferrell) insists on putting her back in the box. mattel secretary gloria (america ferrera) had caused the problem by drawing new forms of barbie.first, i love the premise and i love the 2001 opening. the start is a lot funnier than i expected. margot robbie is great and ryan gosling is hilarious. it's a great start in barbieland. the first moments in la is a little too much. quite frankly, barbie and ken would not stand out at venice beach. the male leering is good enough. they don't need to do the stereotype abusive guys. the real world should be realistic. barbie and ken would be better fishes out of the water in a recognizable regular world. the more average the real world is, the better it is for the characters to showcase their outrageousness.mattel is fun and i like the ridiculous silliness. will ferrell is a good way to show their outrageous quality. the movie has a lot of social commentary and that aspect does threaten to overwhelm it. the last act has some wonky moments as the movie tries to wrap its arms around the heavier social discussions. i would like to keep that more contained and concentrate on the mother daughter relationships. it's gloria and sasha, but it's also ruth and barbara. that's a perfect way to end the movie. i do like the montage idea, but i didn't realize what it was doing initially. it would have been fine to do that for the closing credits. 
all in all, this is a funny engaging movie and it's able to deal with some of the tougher social material."</li></ul> |
|
176 |
+
|
177 |
+
## Evaluation
|
178 |
+
|
179 |
+
### Metrics
|
180 |
+
| Label | Accuracy | Precision | Recall | F1 |
|
181 |
+
|:--------|:---------|:----------|:-------|:-------|
|
182 |
+
| **all** | 0.8812 | 0.9952 | 0.8757 | 0.9316 |
|
183 |
+
|
184 |
+
## Uses
|
185 |
+
|
186 |
+
### Direct Use for Inference
|
187 |
+
|
188 |
+
First install the SetFit library:
|
189 |
+
|
190 |
+
```bash
|
191 |
+
pip install setfit
|
192 |
+
```
|
193 |
+
|
194 |
+
Then you can load this model and run inference.
|
195 |
+
|
196 |
+
```python
|
197 |
+
from setfit import SetFitModel
|
198 |
+
|
199 |
+
# Download from the 🤗 Hub
|
200 |
+
model = SetFitModel.from_pretrained("carlesoctav/SentimentClassifierBarbieDune-8shot")
|
201 |
+
# Run inference
|
202 |
+
preds = model("decent i like what they did with this movie and the characters with its combining the barbie world and the real world. barbie starts getting \"vibes\" and has to go into the real world to find the girl who played with her to set things right and winds up in the mattel headquarters. something resembling chaos ensues. ken joins her and winds up causing further damage. i like what they do in various stages of the story and with the characters. it was overall a very pleasant surprise snd a good movie with a good cast. margot robbie, ryan gosling, america ferrera, and will ferrell were all good in their roles. if you are a movie and/or a barbie fan, you will love this movie.*** out of **** 2 out of 7 found this helpful. was this review helpful? sign in to vote. permalink")
|
203 |
+
```
|
204 |
+
|
205 |
+
<!--
|
206 |
+
### Downstream Use
|
207 |
+
|
208 |
+
*List how someone could finetune this model on their own dataset.*
|
209 |
+
-->
|
210 |
+
|
211 |
+
<!--
|
212 |
+
### Out-of-Scope Use
|
213 |
+
|
214 |
+
*List how the model may foreseeably be misused and address what users ought not to do with the model.*
|
215 |
+
-->
|
216 |
+
|
217 |
+
<!--
|
218 |
+
## Bias, Risks and Limitations
|
219 |
+
|
220 |
+
*What are the known or foreseeable issues stemming from this model? You could also flag here known failure cases or weaknesses of the model.*
|
221 |
+
-->
|
222 |
+
|
223 |
+
<!--
|
224 |
+
### Recommendations
|
225 |
+
|
226 |
+
*What are recommendations with respect to the foreseeable issues? For example, filtering explicit content.*
|
227 |
+
-->
|
228 |
+
|
229 |
+
## Training Details
|
230 |
+
|
231 |
+
### Training Set Metrics
|
232 |
+
| Training set | Min | Mean | Max |
|
233 |
+
|:-------------|:----|:---------|:-----|
|
234 |
+
| Word count | 112 | 234.1953 | 1424 |
|
235 |
+
|
236 |
+
| Label | Training Sample Count |
|
237 |
+
|:---------|:----------------------|
|
238 |
+
| negative | 64 |
|
239 |
+
| positive | 64 |
|
240 |
+
|
241 |
+
### Training Hyperparameters
|
242 |
+
- batch_size: (16, 16)
|
243 |
+
- num_epochs: (1, 1)
|
244 |
+
- max_steps: -1
|
245 |
+
- sampling_strategy: oversampling
|
246 |
+
- body_learning_rate: (2e-05, 1e-05)
|
247 |
+
- head_learning_rate: 0.01
|
248 |
+
- loss: CosineSimilarityLoss
|
249 |
+
- distance_metric: cosine_distance
|
250 |
+
- margin: 0.25
|
251 |
+
- end_to_end: False
|
252 |
+
- use_amp: False
|
253 |
+
- warmup_proportion: 0.1
|
254 |
+
- seed: 42
|
255 |
+
- eval_max_steps: -1
|
256 |
+
- load_best_model_at_end: True
|
257 |
+
|
258 |
+
### Training Results
|
259 |
+
| Epoch | Step | Training Loss | Validation Loss |
|
260 |
+
|:-------:|:-------:|:-------------:|:---------------:|
|
261 |
+
| 0.0019 | 1 | 0.3627 | - |
|
262 |
+
| 0.0962 | 50 | 0.0007 | - |
|
263 |
+
| 0.1923 | 100 | 0.1003 | - |
|
264 |
+
| 0.2885 | 150 | 0.0001 | - |
|
265 |
+
| 0.3846 | 200 | 0.0001 | - |
|
266 |
+
| 0.4808 | 250 | 0.0001 | - |
|
267 |
+
| 0.5769 | 300 | 0.0001 | - |
|
268 |
+
| 0.6731 | 350 | 0.0 | - |
|
269 |
+
| 0.7692 | 400 | 0.0001 | - |
|
270 |
+
| 0.8654 | 450 | 0.0 | - |
|
271 |
+
| 0.9615 | 500 | 0.0 | - |
|
272 |
+
| **1.0** | **520** | **-** | **0.2312** |
|
273 |
+
|
274 |
+
* The bold row denotes the saved checkpoint.
|
275 |
+
### Framework Versions
|
276 |
+
- Python: 3.10.11
|
277 |
+
- SetFit: 1.0.3
|
278 |
+
- Sentence Transformers: 2.5.1
|
279 |
+
- Transformers: 4.38.2
|
280 |
+
- PyTorch: 2.0.1
|
281 |
+
- Datasets: 2.18.0
|
282 |
+
- Tokenizers: 0.15.2
|
283 |
+
|
284 |
+
## Citation
|
285 |
+
|
286 |
+
### BibTeX
|
287 |
+
```bibtex
|
288 |
+
@article{https://doi.org/10.48550/arxiv.2209.11055,
|
289 |
+
doi = {10.48550/ARXIV.2209.11055},
|
290 |
+
url = {https://arxiv.org/abs/2209.11055},
|
291 |
+
author = {Tunstall, Lewis and Reimers, Nils and Jo, Unso Eun Seo and Bates, Luke and Korat, Daniel and Wasserblat, Moshe and Pereg, Oren},
|
292 |
+
keywords = {Computation and Language (cs.CL), FOS: Computer and information sciences, FOS: Computer and information sciences},
|
293 |
+
title = {Efficient Few-Shot Learning Without Prompts},
|
294 |
+
publisher = {arXiv},
|
295 |
+
year = {2022},
|
296 |
+
copyright = {Creative Commons Attribution 4.0 International}
|
297 |
+
}
|
298 |
+
```
|
299 |
+
|
300 |
+
<!--
|
301 |
+
## Glossary
|
302 |
+
|
303 |
+
*Clearly define terms in order to be accessible across audiences.*
|
304 |
+
-->
|
305 |
+
|
306 |
+
<!--
|
307 |
+
## Model Card Authors
|
308 |
+
|
309 |
+
*Lists the people who create the model card, providing recognition and accountability for the detailed work that goes into its construction.*
|
310 |
+
-->
|
311 |
+
|
312 |
+
<!--
|
313 |
+
## Model Card Contact
|
314 |
+
|
315 |
+
*Provides a way for people who have updates to the Model Card, suggestions, or questions, to contact the Model Card authors.*
|
316 |
+
-->
|
config.json
ADDED
@@ -0,0 +1,24 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"_name_or_path": "exp/Dune2Classifier64shot/step_520",
|
3 |
+
"architectures": [
|
4 |
+
"MPNetModel"
|
5 |
+
],
|
6 |
+
"attention_probs_dropout_prob": 0.1,
|
7 |
+
"bos_token_id": 0,
|
8 |
+
"eos_token_id": 2,
|
9 |
+
"hidden_act": "gelu",
|
10 |
+
"hidden_dropout_prob": 0.1,
|
11 |
+
"hidden_size": 768,
|
12 |
+
"initializer_range": 0.02,
|
13 |
+
"intermediate_size": 3072,
|
14 |
+
"layer_norm_eps": 1e-05,
|
15 |
+
"max_position_embeddings": 514,
|
16 |
+
"model_type": "mpnet",
|
17 |
+
"num_attention_heads": 12,
|
18 |
+
"num_hidden_layers": 12,
|
19 |
+
"pad_token_id": 1,
|
20 |
+
"relative_attention_num_buckets": 32,
|
21 |
+
"torch_dtype": "float32",
|
22 |
+
"transformers_version": "4.38.2",
|
23 |
+
"vocab_size": 30527
|
24 |
+
}
|
config_sentence_transformers.json
ADDED
@@ -0,0 +1,9 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"__version__": {
|
3 |
+
"sentence_transformers": "2.0.0",
|
4 |
+
"transformers": "4.7.0",
|
5 |
+
"pytorch": "1.9.0+cu102"
|
6 |
+
},
|
7 |
+
"prompts": {},
|
8 |
+
"default_prompt_name": null
|
9 |
+
}
|
config_setfit.json
ADDED
@@ -0,0 +1,7 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"normalize_embeddings": false,
|
3 |
+
"labels": [
|
4 |
+
"negative",
|
5 |
+
"positive"
|
6 |
+
]
|
7 |
+
}
|
model.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ab2da127bc3afdc7345786f19cfa0b797c882977a7117012968c03179bc3ef7c
|
3 |
+
size 437967672
|
model_head.pkl
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:5c66f517ee30db960dece161133ad096dcab2caf2a1c58e8f6ca037aaa5470b5
|
3 |
+
size 6997
|
modules.json
ADDED
@@ -0,0 +1,14 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
[
|
2 |
+
{
|
3 |
+
"idx": 0,
|
4 |
+
"name": "0",
|
5 |
+
"path": "",
|
6 |
+
"type": "sentence_transformers.models.Transformer"
|
7 |
+
},
|
8 |
+
{
|
9 |
+
"idx": 1,
|
10 |
+
"name": "1",
|
11 |
+
"path": "1_Pooling",
|
12 |
+
"type": "sentence_transformers.models.Pooling"
|
13 |
+
}
|
14 |
+
]
|
sentence_bert_config.json
ADDED
@@ -0,0 +1,4 @@
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"max_seq_length": 512,
|
3 |
+
"do_lower_case": false
|
4 |
+
}
|
special_tokens_map.json
ADDED
@@ -0,0 +1,51 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"bos_token": {
|
3 |
+
"content": "<s>",
|
4 |
+
"lstrip": false,
|
5 |
+
"normalized": false,
|
6 |
+
"rstrip": false,
|
7 |
+
"single_word": false
|
8 |
+
},
|
9 |
+
"cls_token": {
|
10 |
+
"content": "<s>",
|
11 |
+
"lstrip": false,
|
12 |
+
"normalized": false,
|
13 |
+
"rstrip": false,
|
14 |
+
"single_word": false
|
15 |
+
},
|
16 |
+
"eos_token": {
|
17 |
+
"content": "</s>",
|
18 |
+
"lstrip": false,
|
19 |
+
"normalized": false,
|
20 |
+
"rstrip": false,
|
21 |
+
"single_word": false
|
22 |
+
},
|
23 |
+
"mask_token": {
|
24 |
+
"content": "<mask>",
|
25 |
+
"lstrip": true,
|
26 |
+
"normalized": false,
|
27 |
+
"rstrip": false,
|
28 |
+
"single_word": false
|
29 |
+
},
|
30 |
+
"pad_token": {
|
31 |
+
"content": "<pad>",
|
32 |
+
"lstrip": false,
|
33 |
+
"normalized": false,
|
34 |
+
"rstrip": false,
|
35 |
+
"single_word": false
|
36 |
+
},
|
37 |
+
"sep_token": {
|
38 |
+
"content": "</s>",
|
39 |
+
"lstrip": false,
|
40 |
+
"normalized": false,
|
41 |
+
"rstrip": false,
|
42 |
+
"single_word": false
|
43 |
+
},
|
44 |
+
"unk_token": {
|
45 |
+
"content": "[UNK]",
|
46 |
+
"lstrip": false,
|
47 |
+
"normalized": false,
|
48 |
+
"rstrip": false,
|
49 |
+
"single_word": false
|
50 |
+
}
|
51 |
+
}
|
tokenizer.json
ADDED
The diff for this file is too large to render.
See raw diff
|
|
tokenizer_config.json
ADDED
@@ -0,0 +1,66 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"added_tokens_decoder": {
|
3 |
+
"0": {
|
4 |
+
"content": "<s>",
|
5 |
+
"lstrip": false,
|
6 |
+
"normalized": false,
|
7 |
+
"rstrip": false,
|
8 |
+
"single_word": false,
|
9 |
+
"special": true
|
10 |
+
},
|
11 |
+
"1": {
|
12 |
+
"content": "<pad>",
|
13 |
+
"lstrip": false,
|
14 |
+
"normalized": false,
|
15 |
+
"rstrip": false,
|
16 |
+
"single_word": false,
|
17 |
+
"special": true
|
18 |
+
},
|
19 |
+
"2": {
|
20 |
+
"content": "</s>",
|
21 |
+
"lstrip": false,
|
22 |
+
"normalized": false,
|
23 |
+
"rstrip": false,
|
24 |
+
"single_word": false,
|
25 |
+
"special": true
|
26 |
+
},
|
27 |
+
"104": {
|
28 |
+
"content": "[UNK]",
|
29 |
+
"lstrip": false,
|
30 |
+
"normalized": false,
|
31 |
+
"rstrip": false,
|
32 |
+
"single_word": false,
|
33 |
+
"special": true
|
34 |
+
},
|
35 |
+
"30526": {
|
36 |
+
"content": "<mask>",
|
37 |
+
"lstrip": true,
|
38 |
+
"normalized": false,
|
39 |
+
"rstrip": false,
|
40 |
+
"single_word": false,
|
41 |
+
"special": true
|
42 |
+
}
|
43 |
+
},
|
44 |
+
"bos_token": "<s>",
|
45 |
+
"clean_up_tokenization_spaces": true,
|
46 |
+
"cls_token": "<s>",
|
47 |
+
"do_basic_tokenize": true,
|
48 |
+
"do_lower_case": true,
|
49 |
+
"eos_token": "</s>",
|
50 |
+
"mask_token": "<mask>",
|
51 |
+
"max_length": 512,
|
52 |
+
"model_max_length": 512,
|
53 |
+
"never_split": null,
|
54 |
+
"pad_to_multiple_of": null,
|
55 |
+
"pad_token": "<pad>",
|
56 |
+
"pad_token_type_id": 0,
|
57 |
+
"padding_side": "right",
|
58 |
+
"sep_token": "</s>",
|
59 |
+
"stride": 0,
|
60 |
+
"strip_accents": null,
|
61 |
+
"tokenize_chinese_chars": true,
|
62 |
+
"tokenizer_class": "MPNetTokenizer",
|
63 |
+
"truncation_side": "right",
|
64 |
+
"truncation_strategy": "longest_first",
|
65 |
+
"unk_token": "[UNK]"
|
66 |
+
}
|
vocab.txt
ADDED
The diff for this file is too large to render.
See raw diff
|
|