From f50c8e5fdc8a39d7977d4b2516c67b5ac067d56c Mon Sep 17 00:00:00 2001
From: Notisset
Date: Fri, 10 Nov 2017 00:55:37 +0100
Subject: [PATCH] Initial commit

---
Review note: scraper.py below was revised (request timeout, HTTP status
check, comments, trailing newline); the blob id on its "index" line
predates that revision.

 .gitignore |  2 ++
 scraper.py | 39 +++++++++++++++++++++++++++++++++++++++
 2 files changed, 41 insertions(+)
 create mode 100644 .gitignore
 create mode 100755 scraper.py

diff --git a/.gitignore b/.gitignore
new file mode 100644
index 0000000..c6ef218
--- /dev/null
+++ b/.gitignore
@@ -0,0 +1,2 @@
+.idea
+
diff --git a/scraper.py b/scraper.py
new file mode 100755
index 0000000..16ea9ce
--- /dev/null
+++ b/scraper.py
@@ -0,0 +1,39 @@
+#! /usr/bin/env python
+"""Print the result blocks from the viaggiatreno.it mobile station page.
+
+Posts the station form for one hard-coded station, prints the raw response
+body, then prints every <div class="bloccorisultato"> found in the HTML.
+"""
+import requests
+from bs4 import BeautifulSoup
+
+STATION_URL = 'http://viaggiatreno.it/vt_pax_internet/mobile/stazione'
+
+# Seconds to wait on the server. requests applies no timeout by default, so
+# without this a stalled connection would block the script indefinitely.
+REQUEST_TIMEOUT = 10
+
+# Start from the requests defaults and override only the User-Agent.
+headers = requests.utils.default_headers()
+headers.update({"User-Agent": "Mozilla/5.0"})
+
+# Form fields sent in the POST body.
+# NOTE(review): requests form-encodes these values, so the '+' is sent as a
+# literal plus sign (%2B), not as a space -- confirm that is what is wanted.
+data = {
+    'codiceStazione': 'S01700Milano+Centrale',
+    'lang': 'IT',
+}
+
+r = requests.post(STATION_URL, headers=headers, data=data,
+                  timeout=REQUEST_TIMEOUT)
+# Stop on a 4xx/5xx reply instead of parsing an error page.
+r.raise_for_status()
+
+# NOTE(review): on Python 3 this prints the bytes repr (b'...'), not text.
+print(r.text.encode('utf-8'))
+soup = BeautifulSoup(r.text, 'html.parser')
+treni = soup.find_all("div", class_="bloccorisultato")
+
+for treno in treni:
+    print(treno)