# Data Fetching #1358
# This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
# Learn more about bidirectional Unicode characters
# Workflow name as shown in the Actions tab.
name: Data Fetching
on:
  # Run on every push (no branch or path filter is configured).
  push:
  # Run daily at 19:05. GitHub evaluates cron schedules in UTC.
  schedule:
    - cron: "5 19 * * *"
  # Allow manual runs from the Actions tab or the API.
  workflow_dispatch:
jobs:
  # Single job: run the crawler scripts, archive their outputs as a workflow
  # artifact, then publish a subset of the generated files to gh-pages.
  Fetch-Route-Data:
    runs-on: ubuntu-latest
    # The final step pushes a commit to the gh-pages branch, which requires
    # write access to repository contents. Declaring it here keeps the job
    # working when the repository default GITHUB_TOKEN is read-only.
    permissions:
      contents: write
    steps:
      - name: Check out repository code
        uses: actions/checkout@v4

      - name: Setup Python environment
        uses: actions/setup-python@v5
        with:
          # Quoted so the version is read as a string, not a float.
          python-version: '3.12'
          architecture: 'x64'
          # Cache pip downloads, keyed on the crawler requirements file.
          cache: 'pip'
          cache-dependency-path: crawling/requirements.txt

      - name: Install dependencies
        run: |
          python -m pip install --upgrade pip
          pip install -r ./crawling/requirements.txt

      - name: Crawling resources
        env:
          # Passed to the scripts through the environment.
          # NOTE(review): presumably caps concurrent requests - confirm in
          # ./crawling.
          REQUEST_LIMIT: "6"
        # Scripts run sequentially in the order listed; the default run shell
        # (bash -e) aborts the step at the first script that exits non-zero.
        # NOTE(review): later scripts (match/cleanse/merge) presumably consume
        # the outputs of earlier ones - keep the order unless verified.
        run: |
          # Echo each command so the log shows which script is running.
          set -o xtrace
          python ./crawling/parseHoliday.py
          python ./crawling/ctb.py
          python ./crawling/kmb.py
          python ./crawling/nlb.py
          python ./crawling/lrtfeeder.py
          python ./crawling/lightRail.py
          python ./crawling/mtr.py
          python ./crawling/parseJourneyTime.py
          python ./crawling/parseGtfs.py
          python ./crawling/parseGtfsEn.py
          python ./crawling/gmb.py
          python ./crawling/sunferry.py
          python ./crawling/fortuneferry.py
          python ./crawling/hkkf.py
          python ./crawling/matchGtfs.py
          python ./crawling/cleansing.py
          python ./crawling/mergeRoutes.py
          python ./crawling/mergeStopList.py
          python ./crawling/routeCompare.py
          python ./crawling/mtrExits.py

      - name: Archive crawling outputs
        uses: actions/upload-artifact@v4
        # Upload even when an earlier step failed, so partial outputs remain
        # available for debugging.
        if: always()
        with:
          name: Crawled Files
          retention-days: 14
          path: |
            holiday.json
            routeFareList*
            routeList*
            stopList*
            stopMap*
            routeTime.json
            gtfs
            gtfs.json
            routeGtfs*
            gtfs.zip
            ROUTE_BUS.xml
            route-ts/
            exits.mtr.json

      - name: Update MD5
        # Writes the bare hex digest (first field of md5sum's output, with the
        # trailing newline removed) next to each minified file.
        run: |
          # Without pipefail the pipeline's status is that of `tr`, so a
          # failing md5sum (e.g. missing input) would silently produce an
          # empty .md5 file.
          set -o pipefail
          md5sum routeFareList.min.json | cut -f1 -d ' ' | tr -d $'\n' > routeFareList.md5
          md5sum routeFareList.alpha.min.json | cut -f1 -d ' ' | tr -d $'\n' > routeFareList.alpha.md5

      - name: create deployment folder
        run: mkdir -p build

      - name: cp files into deployment folder
        # Only these files (plus route-ts, copied in the next step) are
        # published; the other crawl outputs stay in the workflow artifact.
        run: |
          cp \
            routeFareList.json \
            routeFareList.min.json \
            routeFareList.alpha.json \
            routeFareList.alpha.min.json \
            routeFareList.md5 \
            routeFareList.alpha.md5 \
            CNAME \
            exits.mtr.json \
            build/

      - name: cp route-ts into deployment folder
        run: cp -r route-ts build

      - name: Update resources
        uses: JamesIves/github-pages-deploy-action@v4
        with:
          folder: build
          commit-message: Update resources
          branch: gh-pages
          # Keep files already on gh-pages that are not part of this build.
          clean: false