davidberenstein1957 HF staff committed on
Commit
0c1d5b6
·
1 Parent(s): 93f233e

Update the multi-labelling prompt

Browse files
src/synthetic_dataset_generator/apps/textcat.py CHANGED
@@ -105,7 +105,7 @@ def generate_dataset(
105
  is_sample=is_sample,
106
  )
107
  labeller_generator = get_labeller_generator(
108
- system_prompt=f"{system_prompt} {', '.join(labels)}",
109
  labels=labels,
110
  multi_label=multi_label,
111
  )
@@ -134,7 +134,6 @@ def generate_dataset(
134
  else:
135
  k = 1
136
 
137
- print(k)
138
  sampled_labels = random.sample(labels, min(k, len(labels)))
139
  random.shuffle(sampled_labels)
140
  inputs.append(
 
105
  is_sample=is_sample,
106
  )
107
  labeller_generator = get_labeller_generator(
108
+ system_prompt=f"{system_prompt}. Potential labels: {', '.join(labels)}",
109
  labels=labels,
110
  multi_label=multi_label,
111
  )
 
134
  else:
135
  k = 1
136
 
 
137
  sampled_labels = random.sample(labels, min(k, len(labels)))
138
  random.shuffle(sampled_labels)
139
  inputs.append(