mirror of
https://github.com/guezoloic/millesima_projetS6.git
synced 2026-03-28 19:13:42 +00:00
ajout(main.py): ajout dans csv
This commit is contained in:
2
.gitignore
vendored
2
.gitignore
vendored
@@ -205,3 +205,5 @@ cython_debug/
|
|||||||
marimo/_static/
|
marimo/_static/
|
||||||
marimo/_lsp/
|
marimo/_lsp/
|
||||||
__marimo__/
|
__marimo__/
|
||||||
|
|
||||||
|
*.csv
|
||||||
7
main.py
7
main.py
@@ -299,10 +299,11 @@ class Scraper:
|
|||||||
except JSONDecodeError | HTTPError:
|
except JSONDecodeError | HTTPError:
|
||||||
return None
|
return None
|
||||||
|
|
||||||
def getvins(self, subdir: str):
|
def getvins(self, subdir: str, filename: str):
|
||||||
cache: set[str] = set[str]()
|
cache: set[str] = set[str]()
|
||||||
page = 0
|
page = 0
|
||||||
|
|
||||||
|
with open(filename, 'a') as f:
|
||||||
while True:
|
while True:
|
||||||
page += 1
|
page += 1
|
||||||
products_list = self._geturlproductslist(f"{subdir}?page={page}")
|
products_list = self._geturlproductslist(f"{subdir}?page={page}")
|
||||||
@@ -320,10 +321,12 @@ class Scraper:
|
|||||||
if link and link not in cache:
|
if link and link not in cache:
|
||||||
try:
|
try:
|
||||||
infos = self.getjsondata(link).informations()
|
infos = self.getjsondata(link).informations()
|
||||||
|
_ = f.write(infos + "\n")
|
||||||
print(infos)
|
print(infos)
|
||||||
cache.add(link)
|
cache.add(link)
|
||||||
except JSONDecodeError | HTTPError as e:
|
except JSONDecodeError | HTTPError as e:
|
||||||
print(f"Erreur sur le produit {link}: {e}")
|
print(f"Erreur sur le produit {link}: {e}")
|
||||||
|
f.flush()
|
||||||
|
|
||||||
|
|
||||||
# Scraper().getvins("bordeaux.html")
|
Scraper().getvins("bordeaux.html", "donnee.csv")
|
||||||
|
|||||||
Reference in New Issue
Block a user