So dekodieren Sie den UTF-8-Text aus der newspaper3k-Bibliothek
Posted: 31 Aug 2025, 13:44
Code: Select all
class ArticleScraper:
    """Download articles with ``newspaper`` and merge them into one string.

    NOTE(review): relies on ``newspaper`` and ``urllib.parse`` being imported
    at module level; those imports are not visible in this snippet.
    """

    def __init__(self):
        """Create a scraper; no instance state is kept."""

    def _scrape_one(self, link):
        """Download and parse one article, echo it, and return its text entry.

        The entry is printed after passing through ``urllib.parse.unquote``;
        the returned string is the entry as built, without that decoding.
        """
        article = newspaper.Article(url="%s" % link, language='en')
        article.download()
        article.parse()
        entry = f"TITLE:{article.title} ARTICLES: {article.text}"
        print(urllib.parse.unquote(entry))
        return entry

    def articleScraper(self, article_links):
        """Scrape every URL in ``article_links`` and join the results.

        Args:
            article_links: Iterable of article URLs, processed in order.

        Returns:
            One ``TITLE:... ARTICLES: ...`` entry per URL, joined with
            newlines; an empty string when no URLs are given.
        """
        entries = [self._scrape_one(link) for link in article_links]
        return "\n".join(entries)
# Scrape every URL in list_of_urls (defined elsewhere) and print the
# newline-joined result returned by the scraper.
sol = ArticleScraper()
print(sol.articleScraper(article_links=list_of_urls))