From da3522aa76bc52ff835a0b12fda74d09bd7f1f03 Mon Sep 17 00:00:00 2001
From: scossa
Date: Thu, 1 Dec 2022 23:26:10 +0100
Subject: [PATCH] Update 'ScrapeJE.py'

---
Review notes (this section is ignored by `git am`):
 * Prompts the user for the Just Eat menu URL (colored via colorama)
   instead of using a hard-coded one; the pasted URL is stripped of
   surrounding whitespace.
 * The hint line is printed with a bare print(); the previous
   `url = print(...)` only bound None to `url` before it was overwritten.
 * Name extraction now tolerates a missing "menu-item-name" element
   (`find()` returning None) and skips non-text / whitespace-only children;
   the former `att != type(None)` test compared against the NoneType class
   and was always true.
 * The trailing `else: continue` was dropped as a no-op. NOTE(review): if it
   was meant as a `for ... else` that skips the whole menu item, restore it.
 * Indentation inside the last hunk is assumed to be 4 spaces, and the
   post-image hash on the `index` line predates these fixes - confirm
   against the target file before applying.

 ScrapeJE.py | 20 ++++++++++++++++----
 1 file changed, 16 insertions(+), 4 deletions(-)

diff --git a/ScrapeJE.py b/ScrapeJE.py
index c55d524..2bc5256 100644
--- a/ScrapeJE.py
+++ b/ScrapeJE.py
@@ -2,6 +2,9 @@ import requests
 from bs4 import BeautifulSoup
 #import cloudscraper
 #import json
+import colorama
+from colorama import Fore
+from colorama import Style
 
 nome=[]
 desc=[]
@@ -11,8 +14,14 @@ scripto=[]
 
 
 #prende l url della pagina justeat del ristorante in input
-url = "https://www.justeat.it/restaurants-pizzeria-la-garganica-bologna/menu"
+#url = "https://www.justeat.it/restaurants-pizzeria-girasole-bologna/menu"
 #url = input('link della pagina justeat del ristorante: ')
+#input ('inserisci il link della pagina justeat del ristorante: ')
+
+print("\n")
+print(Fore.WHITE + Style.DIM + "es https://www.justeat.it/NOME_RISTORANTE/menu" + Style.RESET_ALL)
+url = input(Fore.RED + Style.BRIGHT + "inserisci il link della pagina justeat del ristorante: " + Style.RESET_ALL).strip()
+
 
 #scrape html scavalcando cloudflare
 # scraper = cloudscraper.create_scraper(browser={'browser': 'firefox','platform': 'windows','mobile': False})
@@ -56,8 +65,11 @@ for menu in soup.find_all(attrs={"data-test-id": "menu-item"}):
     att=menu
     #riempie la lista "nome"
-    for att in menu.find(attrs={"data-test-id": "menu-item-name"}):
-        if att != " ":
-            nome.append(att.lstrip().splitlines()[0])
+    for att in menu.find(attrs={"data-test-id": "menu-item-name"}) or []:
+        # keep only the first non-blank text node as the item name
+        if isinstance(att, str) and att.strip():
+            nome.append(att.lstrip().splitlines()[0])
+            break
+
 
     #riempie la lista "desc"
     att=menu.find("p", class_="c-menuItems-description")