From e761964bea84b4ec13f2cfd23a2f7ecde3e7991d15896867045bcefbc482325e Mon Sep 17 00:00:00 2001 From: Ben Varick Date: Fri, 7 Nov 2025 18:07:35 -0800 Subject: [PATCH] added agency_list.csv.sample and updated README --- .gitignore | 3 +++ README.md | 4 +++- config/agency_list.csv.sample | 4 ++++ 3 files changed, 10 insertions(+), 1 deletion(-) create mode 100644 config/agency_list.csv.sample diff --git a/.gitignore b/.gitignore index 326a612..b78c6b2 100644 --- a/.gitignore +++ b/.gitignore @@ -1,6 +1,9 @@ #Exclude the .env file .env +# Exclude agency_list.csv +config/agency_list.csv + #Exclude contents of the postres_data directory postgres_data postgres_data/* diff --git a/README.md b/README.md index acd1cb8..88ba99a 100644 --- a/README.md +++ b/README.md @@ -3,7 +3,7 @@ Dagster setup that scrapes GTFS and GTFS-RT for specified transit agencies and adds them to a DuckDB ## Input -This reads from the `config/agency_list.csv` file, edit this file to include the transit agencies that you want to scrape, add the relevant IDs from mobilitydatabase.org +This reads from the `config/agency_list.csv` file. Copy `config/agency_list.csv.sample` to `config/agency_list.csv`, then edit that file to list the transit agencies that you want to scrape, adding the relevant IDs from mobilitydatabase.org. ## set your environment @@ -13,6 +13,8 @@ copy `env.sample` to `.env` and change: - MobilityDatabase.org API token - Location of data, config, and postgres_data directories (default is in working directory) + + # Run it `docker compose build` `docker compose up -d` diff --git a/config/agency_list.csv.sample b/config/agency_list.csv.sample new file mode 100644 index 0000000..6c014a9 --- /dev/null +++ b/config/agency_list.csv.sample @@ -0,0 +1,4 @@ +Name,GTFS,GTFS-RT_vehicles,GTFS-RT_trips,GTFS-RT_alerts +Madison Metro,mdb-394,mdb-2097,mdb-2096,mdb-2095 +Milwaukee County Transit System,mdb-2127,mdb-2130,mdb-2128,mdb-2129 +Whatcom Transportation Authority,mdb-284,tld-4358-vp,tld-4358-tu,tld-4358-sa