This repository has been archived by the owner on Jan 29, 2023. It is now read-only.
-
Notifications
You must be signed in to change notification settings - Fork 0
/
spider.sh
67 lines (61 loc) · 1.69 KB
/
spider.sh
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
#!/bin/bash
#######################################
# Run the "the_hindu" Scrapy spider from
# /home/runner/work/newspaper/newspaper.
# Globals:   none
# Arguments: none
# Outputs:   progress messages on stdout; an error message on stderr when
#            the directory cannot be entered.
# Returns:   1 if the cd fails (scrapy is not started); otherwise the exit
#            status of `scrapy crawl`.
# Note:      the cd is not undone, so the calling shell stays in that
#            directory afterwards.
#######################################
the_hindu() {
  local -r project_dir=/home/runner/work/newspaper/newspaper
  local rc=0

  echo "Cd to folder"
  # Never crawl from an arbitrary directory: stop if the cd fails.
  if ! cd "$project_dir"; then
    printf 'the_hindu: cannot cd to %s\n' "$project_dir" >&2
    return 1
  fi
  echo "in the folder"

  # Disabled: remove existing *.csv files before crawling.
  #rm -f *.csv

  # --nolog silences scrapy, so the exit status is the only failure signal;
  # keep it and hand it back to the caller.
  scrapy crawl --nolog the_hindu || rc=$? #> the_hindu.log
  echo "done"

  # Disabled: print failed_to_download.csv as an aligned table.
  #sed -e 's/,,/, ,/g' failed_to_download.csv | column -s , -t | cat
  return "$rc"
}
#######################################
# Run the "business_standard" Scrapy spider from
# /home/runner/work/newspaper/newspaper.
# Globals:   none
# Arguments: none
# Outputs:   progress messages on stdout; an error message on stderr when
#            the directory cannot be entered.
# Returns:   1 if the cd fails (scrapy is not started); otherwise the exit
#            status of `scrapy crawl`.
# Note:      the cd is not undone, so the calling shell stays in that
#            directory afterwards.
#######################################
bustd() {
  local -r project_dir=/home/runner/work/newspaper/newspaper
  local rc=0

  echo "Cd to folder"
  # Never crawl from an arbitrary directory: stop if the cd fails.
  if ! cd "$project_dir"; then
    printf 'bustd: cannot cd to %s\n' "$project_dir" >&2
    return 1
  fi
  echo "in the folder"

  # Disabled: remove existing *.csv files before crawling.
  #rm -f *.csv

  # --nolog silences scrapy, so the exit status is the only failure signal;
  # keep it and hand it back to the caller.
  scrapy crawl --nolog business_standard || rc=$? #> business_standard.log
  echo "done"

  # Disabled: print failed_to_download.csv as an aligned table.
  #sed -e 's/,,/, ,/g' failed_to_download.csv | column -s , -t | cat
  return "$rc"
}
#######################################
# Run the "economic_times" Scrapy spider from
# /home/runner/work/newspaper/newspaper.
# Globals:   none
# Arguments: none
# Outputs:   progress messages on stdout; an error message on stderr when
#            the directory cannot be entered.
# Returns:   1 if the cd fails (scrapy is not started); otherwise the exit
#            status of `scrapy crawl`.
# Note:      the cd is not undone, so the calling shell stays in that
#            directory afterwards.
#######################################
etime() {
  local -r project_dir=/home/runner/work/newspaper/newspaper
  local rc=0

  echo "Cd to folder"
  # Never crawl from an arbitrary directory: stop if the cd fails.
  if ! cd "$project_dir"; then
    printf 'etime: cannot cd to %s\n' "$project_dir" >&2
    return 1
  fi
  echo "in the folder"

  # Disabled: remove existing *.csv files before crawling.
  #rm -f *.csv

  # --nolog silences scrapy, so the exit status is the only failure signal;
  # keep it and hand it back to the caller.
  scrapy crawl --nolog economic_times || rc=$? #> economic_times.log
  echo "done"

  # Disabled: print failed_to_download.csv as an aligned table.
  #sed -e 's/,,/, ,/g' failed_to_download.csv | column -s , -t | cat
  return "$rc"
}
#######################################
# Run the "livemint" Scrapy spider from
# /home/runner/work/newspaper/newspaper.
# Globals:   none
# Arguments: none
# Outputs:   progress messages on stdout; an error message on stderr when
#            the directory cannot be entered.
# Returns:   1 if the cd fails (scrapy is not started); otherwise the exit
#            status of `scrapy crawl`.
# Note:      the cd is not undone, so the calling shell stays in that
#            directory afterwards.
#######################################
livem() {
  local -r project_dir=/home/runner/work/newspaper/newspaper
  local rc=0

  echo "Cd to folder"
  # Never crawl from an arbitrary directory: stop if the cd fails.
  if ! cd "$project_dir"; then
    printf 'livem: cannot cd to %s\n' "$project_dir" >&2
    return 1
  fi
  echo "in the folder"

  # Disabled: remove existing *.csv files before crawling.
  #rm -f *.csv

  # --nolog silences scrapy, so the exit status is the only failure signal;
  # keep it and hand it back to the caller.
  scrapy crawl --nolog livemint || rc=$? #> livemint.log
  echo "done"

  # Disabled: print failed_to_download.csv as an aligned table.
  #sed -e 's/,,/, ,/g' failed_to_download.csv | column -s , -t | cat
  return "$rc"
}
#######################################
# Run the "indian_express" Scrapy spider from
# /home/runner/work/newspaper/newspaper.
# Globals:   none
# Arguments: none
# Outputs:   progress messages on stdout; an error message on stderr when
#            the directory cannot be entered.
# Returns:   1 if the cd fails (scrapy is not started); otherwise the exit
#            status of `scrapy crawl`.
# Note:      the cd is not undone, so the calling shell stays in that
#            directory afterwards.
#######################################
indexp() {
  local -r project_dir=/home/runner/work/newspaper/newspaper
  local rc=0

  echo "Cd to folder"
  # Never crawl from an arbitrary directory: stop if the cd fails.
  if ! cd "$project_dir"; then
    printf 'indexp: cannot cd to %s\n' "$project_dir" >&2
    return 1
  fi
  echo "in the folder"

  # Disabled: remove existing *.csv files before crawling.
  #rm -f *.csv

  # --nolog silences scrapy, so the exit status is the only failure signal;
  # keep it and hand it back to the caller.
  scrapy crawl --nolog indian_express || rc=$? #> indian_express.log
  echo "done"

  # Disabled: print failed_to_download.csv as an aligned table.
  #sed -e 's/,,/, ,/g' failed_to_download.csv | column -s , -t | cat
  return "$rc"
}
#######################################
# Run the "financial_express" Scrapy spider from
# /home/runner/work/newspaper/newspaper.
# Globals:   none
# Arguments: none
# Outputs:   progress messages on stdout; an error message on stderr when
#            the directory cannot be entered.
# Returns:   1 if the cd fails (scrapy is not started); otherwise the exit
#            status of `scrapy crawl`.
# Note:      the cd is not undone, so the calling shell stays in that
#            directory afterwards.
#######################################
finexp() {
  local -r project_dir=/home/runner/work/newspaper/newspaper
  local rc=0

  echo "Cd to folder"
  # Never crawl from an arbitrary directory: stop if the cd fails.
  if ! cd "$project_dir"; then
    printf 'finexp: cannot cd to %s\n' "$project_dir" >&2
    return 1
  fi
  echo "in the folder"

  # Disabled: remove existing *.csv files before crawling.
  #rm -f *.csv

  # --nolog silences scrapy, so the exit status is the only failure signal;
  # keep it and hand it back to the caller.
  scrapy crawl --nolog financial_express || rc=$? #> financial_express.log
  echo "done"

  # Disabled: print failed_to_download.csv as an aligned table.
  #sed -e 's/,,/, ,/g' failed_to_download.csv | column -s , -t | cat
  return "$rc"
}
# Invoke each spider wrapper once, sequentially, in this fixed order.
# A failing wrapper does not stop the ones after it.
for spider_fn in the_hindu bustd etime finexp livem indexp; do
  "$spider_fn"
done