get-definitions: avoid ambiguity loops

This commit is contained in:
dece 2021-03-16 00:46:07 +01:00
parent 5fb2c37142
commit ada70b65e7

View file

@@ -10,6 +10,7 @@ from requests import models
BASE_URL = "https://www.cnrtl.fr/definition/" BASE_URL = "https://www.cnrtl.fr/definition/"
CRIMINAL_SCUM = []
def main(): def main():
@@ -59,10 +60,11 @@ def get_definitions(form):
if h2: if h2:
title = str(h2.string).strip() title = str(h2.string).strip()
if title == "Terme introuvable": if title == "Terme introuvable":
CRIMINAL_SCUM.append(form)
links = contentbox("a") links = contentbox("a")
for link in links: for link in links:
alternative_form = str(link.string).strip() alternative_form = str(link.string).strip()
if alternative_form == form: if alternative_form in CRIMINAL_SCUM:
continue continue
get_definitions(alternative_form) get_definitions(alternative_form)
elif title == "Erreur": elif title == "Erreur":