-
Notifications
You must be signed in to change notification settings - Fork 2
/
Copy pathrun.sh
57 lines (46 loc) · 1.7 KB
/
run.sh
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
#!/bin/bash
# Main runner script for all files
# Author : Prateek & Nishant
#PREPARING DATA
# Stage 1: fetch the raw inputs into ./data.
#   - runs the two download helper scripts that live in ./data
#   - retrieves airports.csv and carriers.csv with wget
# Every later stage uses paths relative to ./data (including `rm` calls), so
# the script stops here if the directory cannot be entered or a download
# fails, instead of carrying on in the wrong place or with missing inputs.
echo "preparing data..."
sleep 1
cd data || { echo "error: cannot enter the 'data' directory" >&2; exit 1; }

# NOTE(review): assumes both helper scripts exit 0 on success - confirm.
for downloader in ./download_airline.sh ./download_weather.sh; do
  "$downloader" || { echo "error: ${downloader} failed" >&2; exit 1; }
done

for lookup_url in \
  http://stat-computing.org/dataexpo/2009/airports.csv \
  http://stat-computing.org/dataexpo/2009/carriers.csv; do
  wget "$lookup_url" || { echo "error: could not download ${lookup_url}" >&2; exit 1; }
done

echo "All data downloaded.. Now merging data..."
sleep 1
# Stage 2: merge. merge.py is invoked once per year, 1997 through 2006, in
# ascending order; each call receives the year as its only argument.
for year in {1997..2006}; do
  python merge.py "$year"
done
echo "Fetiching some random data to do our task.."
sleep 1
#Random
# Stage 3: draw random samples of 10000, 100000 and 1000000 rows from the ten
# merged yearly files, then delete the intermediate data.
# pick_random.py receives the sample size followed by every merged file; it
# presumably writes randomoutput_<size>.csv, which the filtering stage reads.
merged_files=()
for year in {1997..2006}; do
  merged_files+=("merged${year}.csv")
done

for sample_size in 10000 100000 1000000; do
  # Stop before the cleanup below if sampling fails: the merged files and the
  # raw downloads are the only inputs and are expensive to recreate.
  if ! python pick_random.py "$sample_size" "${merged_files[@]}"; then
    echo "error: pick_random.py failed for sample size ${sample_size}; merged and raw data were kept" >&2
    exit 1
  fi
done

echo "randomdata generated.. cleaning other data now"
# Reached only when all three samples were produced successfully.
rm -- merged*
rm -rf -- airline_data
rm -rf -- weather
echo "Filtering data now.."
sleep 1
# Stage 4: column filtering. For each sample size, filter_columns.py is given
# randomoutput_<size>.csv as its first argument and filtered_<size>.csv as its
# second, smallest sample first.
for sample_size in 10000 100000 1000000; do
  python filter_columns.py "randomoutput_${sample_size}.csv" "filtered_${sample_size}.csv"
done
#TRAINING AND TESTING MODEL NOW
# Stage 5: go back up from ./data to the project root and train the model on
# the largest filtered sample.
cd ../ || { echo "error: cannot return to the parent directory" >&2; exit 1; }
echo "Training data now"
# The filtering stage names its largest output filtered_1000000.csv, so that
# is the file to train on (a ".py" path here would point at nothing).
if ! python train.py ./data/filtered_1000000.csv; then
  echo "error: train.py failed; the model was not trained" >&2
  exit 1
fi
# Printed only after train.py exits successfully.
echo "The model is trained now.."
echo "You may now test the data using python test.py"