diff --git a/DATASET_CARD.md b/DATASET_CARD.md new file mode 100644 index 0000000..98e7464 --- /dev/null +++ b/DATASET_CARD.md @@ -0,0 +1,172 @@ +--- +dataset_info: +- config_name: all-samples + features: + - name: id + dtype: string + - name: title + dtype: string + - name: original_context + dtype: string + - name: question + dtype: string + - name: answers + struct: + - name: answer_start + sequence: int64 + - name: text + sequence: string + - name: validation + dtype: string + - name: context + dtype: string + splits: + - name: train + num_bytes: 55875621 + num_examples: 10001 + download_size: 6994468 + dataset_size: 55875621 +- config_name: default + features: + - name: id + dtype: string + - name: title + dtype: string + - name: question + dtype: string + - name: answers + struct: + - name: answer_start + sequence: int64 + - name: text + sequence: string + - name: validation + dtype: string + - name: context + dtype: string + splits: + - name: train + num_bytes: 2187382 + num_examples: 848 + - name: val + num_bytes: 347924 + num_examples: 128 + - name: test + num_bytes: 2487219 + num_examples: 1024 + download_size: 2042697 + dataset_size: 5022525 +- config_name: incorrect-samples + features: + - name: id + dtype: string + - name: title + dtype: string + - name: question + dtype: string + - name: answers + struct: + - name: answer_start + sequence: int64 + - name: text + sequence: string + - name: validation + dtype: string + - name: context + dtype: string + splits: + - name: train + num_bytes: 6241697 + num_examples: 2395 + download_size: 1492991 + dataset_size: 6241697 +configs: +- config_name: all-samples + data_files: + - split: train + path: all-samples/train-* +- config_name: default + data_files: + - split: train + path: data/train-* + - split: val + path: data/val-* + - split: test + path: data/test-* +- config_name: incorrect-samples + data_files: + - split: train + path: incorrect-samples/train-* +license: cc-by-nc-4.0 +task_categories: +- question-answering +language: +- fo +pretty_name: FoQA +size_categories: +- 1K