-
Notifications
You must be signed in to change notification settings - Fork 9
/
setup_data.sh
32 lines (27 loc) · 1.04 KB
/
setup_data.sh
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
#!/bin/bash
# source: https://github.com/microsoft/deep-language-networks/blob/main/scripts/setup_data.sh
#
# Downloads two dataset archives from GitHub and installs one directory from
# each under ./data (relative to the current working directory):
#   data/ordered_prompt  <- Ordered-Prompt-main/data   (yaolu/Ordered-Prompt)
#   data/leopard         <- leopard-master/data/json   (iesl/leopard)
# Requires: wget, unzip, mktemp.
# Safe to re-run: a destination that already exists is left untouched.

# Stop at the first failing command instead of continuing with missing or
# stale files; treat unset variables and failed pipeline stages as errors.
set -euo pipefail

# Create data folder
mkdir -p data

# Scratch space for downloads and extraction. It lives inside data/ so the
# final `mv` is a rename within one filesystem, and the EXIT trap removes it on
# every exit path so a failed run leaves no archives or half-extracted trees.
scratch_dir=$(mktemp -d data/.setup_data.XXXXXX)
trap 'rm -rf -- "$scratch_dir"' EXIT

#######################################
# Download a zip archive and install one directory from it.
# Globals:   scratch_dir (read)
# Arguments: $1 - URL of the zip archive
#            $2 - path of the wanted directory inside the archive
#            $3 - destination path; skipped if it already exists
# Outputs:   wget/unzip progress; a skip notice on stderr
# Returns:   0 on success or skip; a failing step aborts the script (set -e)
#######################################
fetch_dataset() {
  local url=$1 inner_path=$2 dest=$3
  local unpack_dir

  # Moving onto an existing directory would nest the new copy inside it
  # (e.g. data/ordered_prompt/data), so leave existing destinations alone.
  if [[ -e "$dest" ]]; then
    printf 'setup_data: %s already exists, skipping\n' "$dest" >&2
    return 0
  fi

  unpack_dir=$(mktemp -d "$scratch_dir/unpack.XXXXXX")
  # -O pins the output name; plain wget would save to "<name>.1" when a file
  # of the same name is already present, and unzip would then read stale data.
  wget -O "$unpack_dir/archive.zip" "$url"
  unzip "$unpack_dir/archive.zip" -d "$unpack_dir"
  mv -- "$unpack_dir/$inner_path" "$dest"
}

# Get Ordered Prompt data (including Trec & mpqa)
fetch_dataset \
  https://github.com/yaolu/Ordered-Prompt/archive/refs/heads/main.zip \
  Ordered-Prompt-main/data \
  data/ordered_prompt

# Get Leopard data (including disaster)
fetch_dataset \
  https://github.com/iesl/leopard/archive/refs/heads/master.zip \
  leopard-master/data/json \
  data/leopard
# # Get BBH data (this whole section is intentionally commented out; uncomment to enable)
# wget https://github.com/suzgunmirac/BIG-Bench-Hard/archive/refs/heads/main.zip
# unzip main.zip
# mv BIG-Bench-Hard-main/bbh data/
# rm -rf BIG-Bench-Hard-main
# rm -f main.zip
# # Preprocess BBH data, removing points from BigBench to avoid data contamination
# python scripts/split_bigbench_date_understanding.py
# python scripts/split_bigbench_hyperbaton.py
# python scripts/split_bigbench_logical_deduction_seven_objects.py
# python scripts/split_bigbench_navigate.py