Upload to new Gitea

This commit is contained in:
Remy Moll
2022-08-23 15:12:39 +02:00
parent 9ca4985853
commit 40498ac8f0
4 changed files with 41 additions and 104 deletions

View File

@@ -155,11 +155,11 @@ class PDFDownloader:
hrefs = [e.get_attribute("href") for e in self.driver.find_elements_by_xpath("//a[@href]")]
except:
hrefs = []
len_old = len(hrefs)
# len_old = len(hrefs)
hrefs = [h for h in hrefs \
if not sum([(domain in h) for domain in blacklisted]) # sum([True, False, False, False]) == 1 (esp. not 0)
] # filter a tiny bit at least
self.logger.info(f"Hrefs filtered (before: {len_old}, after: {len(hrefs)})")
# self.logger.info(f"Hrefs filtered (before: {len_old}, after: {len(hrefs)})")
return hrefs