Spaces:
Paused
Paused
nit
Browse files
src/calibration_datasets.py
CHANGED
@@ -214,6 +214,7 @@ class CalibrationDataset(ABC):
|
|
214 |
|
215 |
class WikitextDataset(CalibrationDataset):
|
216 |
dataset = "wikitext"
|
|
|
217 |
dataset_config = {
|
218 |
"path": "wikitext",
|
219 |
"name": "wikitext-103-raw-v1",
|
@@ -221,11 +222,11 @@ class WikitextDataset(CalibrationDataset):
|
|
221 |
}
|
222 |
dataset_name = "Wikitext103 Full"
|
223 |
|
224 |
-
def process_samples(self) -> List[str]:
|
225 |
-
|
226 |
-
|
227 |
-
|
228 |
-
|
229 |
|
230 |
|
231 |
class C4Dataset(CalibrationDataset):
|
|
|
214 |
|
215 |
class WikitextDataset(CalibrationDataset):
|
216 |
dataset = "wikitext"
|
217 |
+
dataset_field = "text"
|
218 |
dataset_config = {
|
219 |
"path": "wikitext",
|
220 |
"name": "wikitext-103-raw-v1",
|
|
|
222 |
}
|
223 |
dataset_name = "Wikitext103 Full"
|
224 |
|
225 |
+
# def process_samples(self) -> List[str]:
|
226 |
+
# return [
|
227 |
+
# "\n" if len(item) == 0 else item
|
228 |
+
# for item in self.data["text"]
|
229 |
+
# ]
|
230 |
|
231 |
|
232 |
class C4Dataset(CalibrationDataset):
|