{
  "builder_name": "json",
  "citation": "",
  "config_name": "default",
  "dataset_name": "json",
  "dataset_size": 2816740545,
  "description": "",
  "download_checksums": {
    "/home/manojale/Documents/Data/commit_data_8m_ready_to_feed.jsonl": {
      "num_bytes": 3110715617,
      "checksum": null
    }
  },
  "download_size": 3110715617,
  "features": {
    "input_ids": {
      "feature": {
        "dtype": "int32",
        "_type": "Value"
      },
      "_type": "Sequence"
    },
    "attention_mask": {
      "feature": {
        "dtype": "int8",
        "_type": "Value"
      },
      "_type": "Sequence"
    },
    "word_ids": {
      "feature": {
        "dtype": "int64",
        "_type": "Value"
      },
      "_type": "Sequence"
    },
    "labels": {
      "feature": {
        "dtype": "int64",
        "_type": "Value"
      },
      "_type": "Sequence"
    }
  },
  "homepage": "",
  "license": "",
  "size_in_bytes": 5927456162,
  "splits": {
    "train": {
      "name": "train",
      "num_bytes": 2816740545,
      "num_examples": 8345771,
      "shard_lengths": [
        1461651,
        1509932,
        1500137,
        1478094,
        1517113,
        878844
      ],
      "dataset_name": "json"
    }
  },
  "version": {
    "version_str": "0.0.0",
    "major": 0,
    "minor": 0,
    "patch": 0
  }
}