2022-08-28 14:57:40 +02:00
|
|
|
import asyncio
|
|
|
|
import aiohttp
|
|
|
|
|
|
|
|
import csv
|
|
|
|
from datetime import datetime
|
|
|
|
from bs4 import BeautifulSoup
|
|
|
|
import re
|
|
|
|
|
|
|
|
|
|
|
|
async def main():
|
|
|
|
stations = []
|
|
|
|
with open('stations.csv') as station_file:
|
|
|
|
stations_list = csv.reader(station_file)
|
|
|
|
for row in stations_list:
|
|
|
|
stations.append(row[1])
|
|
|
|
|
|
|
|
trains = []
|
|
|
|
async with aiohttp.ClientSession() as session:
|
|
|
|
tasks = []
|
2022-08-31 00:08:54 +02:00
|
|
|
for station in stations[:10]:
|
2022-08-28 14:57:40 +02:00
|
|
|
tasks.append(fetch_station(station, session, trains))
|
|
|
|
await asyncio.gather(*tasks)
|
|
|
|
|
|
|
|
print(trains)
|
2022-08-31 00:08:54 +02:00
|
|
|
async with aiohttp.ClientSession() as session:
|
|
|
|
tasks = []
|
|
|
|
for train in trains[:5]:
|
|
|
|
tasks.append(fetch_train(train, session))
|
|
|
|
await asyncio.gather(*tasks)
|
2022-08-28 14:57:40 +02:00
|
|
|
|
|
|
|
|
|
|
|
async def fetch_station(station: str, session: aiohttp.ClientSession, trains: list) -> None:
|
|
|
|
train_list = []
|
|
|
|
url = "http://www.belgianrail.be/jp/nmbs-realtime/stboard.exe/en"
|
2022-08-28 16:26:50 +02:00
|
|
|
url_header = {'User-Agent': 'python script to fetch trains of belgium. (d.tonitch@gmail.com - in case it is a problem)',
|
|
|
|
'From': 'd.tonitch@gmail.com'}
|
2022-08-28 14:57:40 +02:00
|
|
|
url_data = {
|
|
|
|
'realtime': 'Show', # Dunno
|
|
|
|
'sqQueryPageDisplayed': 'yes', # Dunno
|
|
|
|
'REQProduct_list+': '5:1111111000000000', # Dunno
|
|
|
|
'input': station,
|
|
|
|
'REQ0JourneyStopsSID+':
|
|
|
|
'A=1@O=Mouscron@X=3228449@Y=50740997@U=80@L=008885704@B=1@p=1661553118@n=ac.1=GA@',
|
|
|
|
# Don't know what it does so I don't touch
|
|
|
|
'date': datetime.now().strftime('%d/%m/%Y'),
|
|
|
|
'wDayExtsq': 'Mo|Tu|We|Th|Fr|Sa|Su', # Didn't try
|
|
|
|
'time': datetime.now().strftime('%H:%M'),
|
|
|
|
'boardType': 'dep',
|
|
|
|
'maxJourneys': '10', # can be changed but have to be > 10
|
|
|
|
'start': 'Show' # Dunno
|
|
|
|
}
|
|
|
|
try:
|
2022-08-28 16:26:50 +02:00
|
|
|
async with session.post(url, data=url_data, headers=url_header) as resp:
|
2022-08-28 14:57:40 +02:00
|
|
|
if resp.status == 200:
|
|
|
|
print(f"station {station} success ✅")
|
|
|
|
soup = BeautifulSoup(await resp.text(), 'html.parser')
|
|
|
|
products = soup.body.find_all(class_='product')[1:]
|
|
|
|
[i.a.img.decompose() for i in products]
|
|
|
|
train_list = [''.join(i.a.contents) for i in products]
|
|
|
|
for train in train_list:
|
|
|
|
if train not in trains and train:
|
2022-08-28 16:26:50 +02:00
|
|
|
trains.append(re.sub(" +", " ", train.strip()))
|
2022-08-28 14:57:40 +02:00
|
|
|
return None
|
|
|
|
except aiohttp.client_exceptions.ServerDisconnectedError:
|
|
|
|
print(f"station {station} failed ❎ ")
|
|
|
|
|
2022-08-31 00:08:54 +02:00
|
|
|
async def fetch_train(train:str, session: aiohttp.ClientSession):
|
|
|
|
url = "http://www.belgianrail.be/jp/nmbs-realtime/trainsearch.exe/fn?ld=std&"
|
|
|
|
url_header = {'User-Agent': 'python script to fetch trains of belgium. (d.tonitch@gmail.com - in case it is a problem)',
|
|
|
|
'From': 'd.tonitch@gmail.com'}
|
|
|
|
url_data = {
|
|
|
|
'trainname':train.replace(" ", "+"),
|
|
|
|
'selectDate':'oneday',
|
|
|
|
'date':datetime.now().strftime('%d/%m/%Y'),
|
|
|
|
'productClassFilter':'85',
|
|
|
|
'start':'Chercher'
|
|
|
|
}
|
|
|
|
try:
|
|
|
|
async with session.post(url, data=url_data, headers=url_header) as resp:
|
|
|
|
if resp.status == 200:
|
|
|
|
print(f"train {train} success ✅")
|
|
|
|
soup = BeautifulSoup(await resp.text(), 'html.parser')
|
|
|
|
products = soup.body.find_all("td")
|
|
|
|
print(soup.body.prettify())
|
|
|
|
except aiohttp.client_exceptions.ServerDisconnectedError:
|
|
|
|
print(f"train {train} failed ❎ ")
|
|
|
|
|
2022-08-28 14:57:40 +02:00
|
|
|
|
|
|
|
if __name__ == "__main__":
|
|
|
|
asyncio.run(main())
|