{
  "builder_name": "google_wellformed_query",
  "citation": "@misc{faruqui2018identifying,\n title={Identifying Well-formed Natural Language Questions},\n author={Manaal Faruqui and Dipanjan Das},\n year={2018},\n eprint={1808.09419},\n archivePrefix={arXiv},\n primaryClass={cs.CL}\n}\n",
  "config_name": "default",
  "dataset_name": "google_wellformed_query",
  "dataset_size": 1230988,
  "description": "Google's query wellformedness dataset was created by crowdsourcing well-formedness annotations for 25,100 queries from the Paralex corpus. Every query was annotated by five raters each with 1/0 rating of whether or not the query is well-formed.\n",
  "download_checksums": {
    "https://raw.githubusercontent.com/google-research-datasets/query-wellformedness/master/train.tsv": {
      "num_bytes": 805818,
      "checksum": null
    },
    "https://raw.githubusercontent.com/google-research-datasets/query-wellformedness/master/test.tsv": {
      "num_bytes": 178070,
      "checksum": null
    },
    "https://raw.githubusercontent.com/google-research-datasets/query-wellformedness/master/dev.tsv": {
      "num_bytes": 173131,
      "checksum": null
    }
  },
  "download_size": 1157019,
  "features": {
    "rating": {
      "dtype": "float32",
      "_type": "Value"
    },
    "content": {
      "dtype": "string",
      "_type": "Value"
    }
  },
  "homepage": "https://github.com/google-research-datasets/query-wellformedness",
  "license": "",
  "size_in_bytes": 2388007,
  "splits": {
    "train": {
      "name": "train",
      "num_bytes": 857383,
      "num_examples": 17500,
      "dataset_name": "google_wellformed_query"
    },
    "test": {
      "name": "test",
      "num_bytes": 189499,
      "num_examples": 3850,
      "dataset_name": "google_wellformed_query"
    },
    "validation": {
      "name": "validation",
      "num_bytes": 184106,
      "num_examples": 3750,
      "dataset_name": "google_wellformed_query"
    }
  },
  "version": {
    "version_str": "0.0.0",
    "major": 0,
    "minor": 0,
    "patch": 0
  }
}