Path: blob/master/4 - Natural Language Processing with Attention Models/Week 3/data/squad/plain_text/1.0.0/dataset_info.json
65 views
{
  "citation": "@article{2016arXiv160605250R,\n author = {{Rajpurkar}, Pranav and {Zhang}, Jian and {Lopyrev},\n Konstantin and {Liang}, Percy},\n title = \"{SQuAD: 100,000+ Questions for Machine Comprehension of Text}\",\n journal = {arXiv e-prints},\n year = 2016,\n eid = {arXiv:1606.05250},\n pages = {arXiv:1606.05250},\narchivePrefix = {arXiv},\n eprint = {1606.05250},\n}",
  "description": "Stanford Question Answering Dataset (SQuAD) is a reading comprehension dataset, consisting of questions posed by crowdworkers on a set of Wikipedia articles, where the answer to every question is a segment of text, or span, from the corresponding reading passage, or the question might be unanswerable.",
  "downloadSize": "35142551",
  "location": {
    "urls": [
      "https://rajpurkar.github.io/SQuAD-explorer/"
    ]
  },
  "name": "squad",
  "schema": {
    "feature": [
      {
        "name": "answers"
      },
      {
        "name": "context",
        "type": "BYTES"
      },
      {
        "name": "id",
        "type": "BYTES"
      },
      {
        "name": "question",
        "type": "BYTES"
      },
      {
        "name": "title",
        "type": "BYTES"
      }
    ]
  },
  "sizeInBytes": "35142551",
  "splits": [
    {
      "name": "train",
      "numShards": "10",
      "shardLengths": [
        "87599"
      ],
      "statistics": {
        "features": [
          {
            "bytesStats": {
              "commonStats": {
                "numNonMissing": "87599"
              }
            },
            "name": "context",
            "type": "BYTES"
          },
          {
            "bytesStats": {
              "commonStats": {
                "numNonMissing": "87599"
              }
            },
            "name": "id",
            "type": "BYTES"
          },
          {
            "bytesStats": {
              "commonStats": {
                "numNonMissing": "87599"
              }
            },
            "name": "question",
            "type": "BYTES"
          },
          {
            "bytesStats": {
              "commonStats": {
                "numNonMissing": "87599"
              }
            },
            "name": "title",
            "type": "BYTES"
          }
        ],
        "numExamples": "87599"
      }
    },
    {
      "name": "validation",
      "numShards": "1",
      "shardLengths": [
        "10570"
      ],
      "statistics": {
        "features": [
          {
            "bytesStats": {
              "commonStats": {
                "numNonMissing": "10570"
              }
            },
            "name": "context",
            "type": "BYTES"
          },
          {
            "bytesStats": {
              "commonStats": {
                "numNonMissing": "10570"
              }
            },
            "name": "id",
            "type": "BYTES"
          },
          {
            "bytesStats": {
              "commonStats": {
                "numNonMissing": "10570"
              }
            },
            "name": "question",
            "type": "BYTES"
          },
          {
            "bytesStats": {
              "commonStats": {
                "numNonMissing": "10570"
              }
            },
            "name": "title",
            "type": "BYTES"
          }
        ],
        "numExamples": "10570"
      }
    }
  ],
  "version": "1.0.0"
}