Skip to content

Commit

Permalink
Add files via upload
Browse files Browse the repository at this point in the history
  • Loading branch information
andrew-yuhochi authored Jun 25, 2022
1 parent f0b0e0f commit cff6e1a
Show file tree
Hide file tree
Showing 30 changed files with 416 additions and 0 deletions.
1 change: 1 addition & 0 deletions clean_data/PoC_10Q_DatasetDict/dataset_dict.json
Original file line number Diff line number Diff line change
@@ -0,0 +1 @@
{"splits": ["train", "validation", "test"]}
Binary file not shown.
Binary file not shown.
Binary file not shown.
Binary file added clean_data/PoC_10Q_DatasetDict/test/dataset.arrow
Binary file not shown.
50 changes: 50 additions & 0 deletions clean_data/PoC_10Q_DatasetDict/test/dataset_info.json
Original file line number Diff line number Diff line change
@@ -0,0 +1,50 @@
{
"builder_name": null,
"citation": "",
"config_name": null,
"dataset_size": null,
"description": "",
"download_checksums": null,
"download_size": null,
"features": {
"Domain": {
"dtype": "string",
"id": null,
"_type": "Value"
},
"Sub domain": {
"dtype": "string",
"id": null,
"_type": "Value"
},
"Intent": {
"dtype": "string",
"id": null,
"_type": "Value"
},
"value": {
"dtype": "string",
"id": null,
"_type": "Value"
},
"labels": {
"feature": {
"dtype": "int64",
"id": null,
"_type": "Value"
},
"length": -1,
"id": null,
"_type": "Sequence"
}
},
"homepage": "",
"license": "",
"post_processed": null,
"post_processing_size": null,
"size_in_bytes": null,
"splits": null,
"supervised_keys": null,
"task_templates": null,
"version": null
}
14 changes: 14 additions & 0 deletions clean_data/PoC_10Q_DatasetDict/test/state.json
Original file line number Diff line number Diff line change
@@ -0,0 +1,14 @@
{
"_data_files": [
{
"filename": "dataset.arrow"
}
],
"_fingerprint": "48d3ebc4320f1460",
"_format_columns": null,
"_format_kwargs": {},
"_format_type": null,
"_indexes": {},
"_output_all_columns": false,
"_split": null
}
Binary file not shown.
Binary file not shown.
50 changes: 50 additions & 0 deletions clean_data/PoC_10Q_DatasetDict/train/dataset_info.json
Original file line number Diff line number Diff line change
@@ -0,0 +1,50 @@
{
"builder_name": null,
"citation": "",
"config_name": null,
"dataset_size": null,
"description": "",
"download_checksums": null,
"download_size": null,
"features": {
"Domain": {
"dtype": "string",
"id": null,
"_type": "Value"
},
"Sub domain": {
"dtype": "string",
"id": null,
"_type": "Value"
},
"Intent": {
"dtype": "string",
"id": null,
"_type": "Value"
},
"value": {
"dtype": "string",
"id": null,
"_type": "Value"
},
"labels": {
"feature": {
"dtype": "int64",
"id": null,
"_type": "Value"
},
"length": -1,
"id": null,
"_type": "Sequence"
}
},
"homepage": "",
"license": "",
"post_processed": null,
"post_processing_size": null,
"size_in_bytes": null,
"splits": null,
"supervised_keys": null,
"task_templates": null,
"version": null
}
14 changes: 14 additions & 0 deletions clean_data/PoC_10Q_DatasetDict/train/state.json
Original file line number Diff line number Diff line change
@@ -0,0 +1,14 @@
{
"_data_files": [
{
"filename": "dataset.arrow"
}
],
"_fingerprint": "2f19cdd385d5ca9d",
"_format_columns": null,
"_format_kwargs": {},
"_format_type": null,
"_indexes": {},
"_output_all_columns": false,
"_split": null
}
Binary file not shown.
Binary file not shown.
Binary file not shown.
50 changes: 50 additions & 0 deletions clean_data/PoC_10Q_DatasetDict/validation/dataset_info.json
Original file line number Diff line number Diff line change
@@ -0,0 +1,50 @@
{
"builder_name": null,
"citation": "",
"config_name": null,
"dataset_size": null,
"description": "",
"download_checksums": null,
"download_size": null,
"features": {
"Domain": {
"dtype": "string",
"id": null,
"_type": "Value"
},
"Sub domain": {
"dtype": "string",
"id": null,
"_type": "Value"
},
"Intent": {
"dtype": "string",
"id": null,
"_type": "Value"
},
"value": {
"dtype": "string",
"id": null,
"_type": "Value"
},
"labels": {
"feature": {
"dtype": "int64",
"id": null,
"_type": "Value"
},
"length": -1,
"id": null,
"_type": "Sequence"
}
},
"homepage": "",
"license": "",
"post_processed": null,
"post_processing_size": null,
"size_in_bytes": null,
"splits": null,
"supervised_keys": null,
"task_templates": null,
"version": null
}
14 changes: 14 additions & 0 deletions clean_data/PoC_10Q_DatasetDict/validation/state.json
Original file line number Diff line number Diff line change
@@ -0,0 +1,14 @@
{
"_data_files": [
{
"filename": "dataset.arrow"
}
],
"_fingerprint": "01297d791d4261c2",
"_format_columns": null,
"_format_kwargs": {},
"_format_type": null,
"_indexes": {},
"_output_all_columns": false,
"_split": null
}
1 change: 1 addition & 0 deletions clean_data/phase1_74Q_DatasetDict/dataset_dict.json
Original file line number Diff line number Diff line change
@@ -0,0 +1 @@
{"splits": ["train", "validation", "test"]}
Binary file not shown.
Binary file not shown.
Binary file not shown.
60 changes: 60 additions & 0 deletions clean_data/phase1_74Q_DatasetDict/test/dataset_info.json
Original file line number Diff line number Diff line change
@@ -0,0 +1,60 @@
{
"builder_name": null,
"citation": "",
"config_name": null,
"dataset_size": null,
"description": "",
"download_checksums": null,
"download_size": null,
"features": {
"index": {
"dtype": "int64",
"id": null,
"_type": "Value"
},
"Domain": {
"dtype": "string",
"id": null,
"_type": "Value"
},
"Sub domain": {
"dtype": "string",
"id": null,
"_type": "Value"
},
"Intent": {
"dtype": "string",
"id": null,
"_type": "Value"
},
"Answer Format": {
"dtype": "string",
"id": null,
"_type": "Value"
},
"value": {
"dtype": "string",
"id": null,
"_type": "Value"
},
"labels": {
"feature": {
"dtype": "int64",
"id": null,
"_type": "Value"
},
"length": -1,
"id": null,
"_type": "Sequence"
}
},
"homepage": "",
"license": "",
"post_processed": null,
"post_processing_size": null,
"size_in_bytes": null,
"splits": null,
"supervised_keys": null,
"task_templates": null,
"version": null
}
14 changes: 14 additions & 0 deletions clean_data/phase1_74Q_DatasetDict/test/state.json
Original file line number Diff line number Diff line change
@@ -0,0 +1,14 @@
{
"_data_files": [
{
"filename": "dataset.arrow"
}
],
"_fingerprint": "c2895b6836830173",
"_format_columns": null,
"_format_kwargs": {},
"_format_type": null,
"_indexes": {},
"_output_all_columns": false,
"_split": null
}
Binary file not shown.
Binary file not shown.
60 changes: 60 additions & 0 deletions clean_data/phase1_74Q_DatasetDict/train/dataset_info.json
Original file line number Diff line number Diff line change
@@ -0,0 +1,60 @@
{
"builder_name": null,
"citation": "",
"config_name": null,
"dataset_size": null,
"description": "",
"download_checksums": null,
"download_size": null,
"features": {
"index": {
"dtype": "int64",
"id": null,
"_type": "Value"
},
"Domain": {
"dtype": "string",
"id": null,
"_type": "Value"
},
"Sub domain": {
"dtype": "string",
"id": null,
"_type": "Value"
},
"Intent": {
"dtype": "string",
"id": null,
"_type": "Value"
},
"Answer Format": {
"dtype": "string",
"id": null,
"_type": "Value"
},
"value": {
"dtype": "string",
"id": null,
"_type": "Value"
},
"labels": {
"feature": {
"dtype": "int64",
"id": null,
"_type": "Value"
},
"length": -1,
"id": null,
"_type": "Sequence"
}
},
"homepage": "",
"license": "",
"post_processed": null,
"post_processing_size": null,
"size_in_bytes": null,
"splits": null,
"supervised_keys": null,
"task_templates": null,
"version": null
}
14 changes: 14 additions & 0 deletions clean_data/phase1_74Q_DatasetDict/train/state.json
Original file line number Diff line number Diff line change
@@ -0,0 +1,14 @@
{
"_data_files": [
{
"filename": "dataset.arrow"
}
],
"_fingerprint": "010701e0f50f2307",
"_format_columns": null,
"_format_kwargs": {},
"_format_type": null,
"_indexes": {},
"_output_all_columns": false,
"_split": null
}
Binary file not shown.
Binary file not shown.
Loading

0 comments on commit cff6e1a

Please sign in to comment.