-
Notifications
You must be signed in to change notification settings - Fork 2
/
Copy pathget_data.sh
executable file
·102 lines (88 loc) · 2.6 KB
/
get_data.sh
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
#!/bin/bash
# The OHG section is switched off: the condition below is always false, so
# nothing inside the block runs (the original used `[ 3 == 4 ]` for this).
# Change `false` to `true` to enable the download.
if false; then
  #---------------------------------------------------------------------------#
  #---- Get OHG dataset
  #     Expects data/OHG/ to exist relative to the current directory and to
  #     contain the split lists train.lst, val.lst and test.lst.
  #---------------------------------------------------------------------------#
  # Abort if the directory is missing; otherwise the download, rm and mv below
  # would run in whatever directory the script was started from.
  cd data/OHG/ || { echo "$0: cannot cd to data/OHG/" >&2; exit 1; }
  #--- size approx 16.3GB
  wget https://zenodo.org/record/1322666/files/OHG.tar.gz || exit 1
  tar -xvf OHG.tar.gz || exit 1
  rm OHG.tar.gz
  # Collect the extracted b0* directories under data/.
  mkdir data
  mv b0* data/. || exit 1
  mkdir -p train val test
  # For each split, link the image and its PAGE XML for every name in the list.
  for split in train val test; do
    cd "${split}" || exit 1
    # Word-splitting of the list file is intentional: one name per word.
    for f in $(<"../${split}.lst"); do
      # The b0* glob locates the file in whichever extracted directory has it.
      ln -s ../data/b0*/"${f}".tif .
      ln -s ../data/b0*/page/"${f}".xml .
    done
    cd .. || exit 1
  done
  # Back to the directory the script started from (two levels above data/OHG).
  cd ../.. || exit 1
fi
#-----------------------------------------------------------------------------#
#---- Get FCR dataset
#     The FCR_500 archive is downloaded from Zenodo below (the previous header
#     stated that no automatic download was available, which no longer matches
#     the code). Set-up requires data/FCR/ to exist relative to the current
#     directory and to contain train.lst, val.lst and test.lst.
#-----------------------------------------------------------------------------#
# Abort if the directory is missing; otherwise the download, rm and mv below
# would run in whatever directory the script was started from.
cd data/FCR/ || { echo "$0: cannot cd to data/FCR/" >&2; exit 1; }
#--- size approx. 1.2GB
wget https://zenodo.org/record/3945088/files/FCR_500.tar.gz || exit 1
tar -xvf FCR_500.tar.gz || exit 1
rm FCR_500.tar.gz
# Move the extracted data directory up so it lives at data/FCR/data.
mv FCR_500/data . || exit 1
mkdir -p train val test
# For each split, link every file in data/ and data/page/ whose name starts
# with an entry of the corresponding list.
for split in train val test; do
  cd "${split}" || exit 1
  # Word-splitting of the list file is intentional: one name prefix per word.
  for f in $(<"../${split}.lst"); do
    ln -s ../data/"${f}"* .
    ln -s ../data/page/"${f}"* .
  done
  cd .. || exit 1
done
# Back to the directory the script started from (two levels above data/FCR).
cd ../../ || exit 1
# NOTE(review): this unconditional exit ends the script here, so nothing after
# it is executed -- presumably a deliberate switch; confirm before removing.
exit
#-----------------------------------------------------------------------------#
#---- Get ABP dataset
#     Expects data/ABP to exist relative to the current directory and to
#     contain the split lists train.lst, val.lst and test.lst.
#     NOTE(review): as the file stands, an unconditional `exit` precedes this
#     section, so it is not executed.
#-----------------------------------------------------------------------------#
# Abort if the directory is missing; otherwise the download, rm and mv below
# would run in whatever directory the script was started from.
cd data/ABP || { echo "$0: cannot cd to data/ABP" >&2; exit 1; }
#--- size approx 590MB
wget https://zenodo.org/record/1243098/files/READ_ABP_TABLE.zip || exit 1
unzip READ_ABP_TABLE.zip || exit 1
rm READ_ABP_TABLE.zip
# Rename the extracted tree so it lives at data/ABP/data.
mv READ_ABP_TABLE/ data || exit 1
mkdir -p train val test
# For each split, link the image (any extension) and the XML file of every
# name in the corresponding list.
for split in train val test; do
  cd "${split}" || exit 1
  # Word-splitting of the list file is intentional: one name per word.
  for f in $(<"../${split}.lst"); do
    ln -s ../data/dataset111/img/"${f}".* .
    ln -s ../data/dataset111/xml/"${f}".xml .
  done
  cd .. || exit 1
done
# Back to the directory the script started from (two levels above data/ABP).
cd ../../ || exit 1
#-----------------------------------------------------------------------------#
#-----------------------------------------------------------------------------#
#-----------------------------------------------------------------------------#
#-----------------------------------------------------------------------------#