# -*- coding: utf-8 -*-
"""Print the article links listed on the ZEIT ONLINE "die-kaenguru-comics" series pages.

For every overview page the script prints the page URL and then, for each
<article> element on that page, the contents of the article's first <a> tag.

Recovered from the git patch "first commit" (4f89c7b, author f0x1,
2022-01-14), which adds this file as ZeitOnlineRequests.py next to an
empty README.md.
"""
# NOTE(review): os, shutil, time and ThreadPool are not used by the code in
# this commit; the imports are kept exactly as the commit declared them.
import os
import shutil
import sys
from multiprocessing.pool import ThreadPool
from time import time

import requests
from bs4 import BeautifulSoup

base_url = 'https://www.zeit.de/serie/die-kaenguru-comics?p='

# Overview pages to visit, both inclusive (the original loop was range(1, 15)).
FIRST_PAGE = 1
LAST_PAGE = 14

# requests applies no timeout unless one is given, so a stalled connection
# would otherwise block the script indefinitely.
REQUEST_TIMEOUT = 10


def fetch_page(page_url):
    """Return the body text of ``page_url``, or ``None`` if the request failed.

    Connection errors, timeouts and 4xx/5xx responses are reported on stderr
    instead of being raised, so one bad page does not abort the whole run.
    """
    try:
        response = requests.get(page_url, timeout=REQUEST_TIMEOUT)
        response.raise_for_status()
    except requests.RequestException as error:
        sys.stderr.write('skipping {}: {}\n'.format(page_url, error))
        return None
    return response.text


def print_comic_titles(first_page=FIRST_PAGE, last_page=LAST_PAGE):
    """Print each overview page URL followed by the link contents of its articles.

    Args:
        first_page: Number of the first overview page to fetch.
        last_page: Number of the last overview page to fetch (inclusive).
    """
    for page in range(first_page, last_page + 1):
        page_url = base_url + str(page)
        print(page_url)

        html = fetch_page(page_url)
        if html is None:
            continue

        soup = BeautifulSoup(html, 'html.parser')
        for article in soup.find_all('article'):
            link = article.a
            if link is None:
                # An <article> without any <a> has nothing to report;
                # dereferencing it would raise AttributeError.
                continue
            # .contents is the list of the tag's direct children, so this
            # prints a list rather than a plain string (same as the original).
            comic_title = link.contents
            print(comic_title)


if __name__ == '__main__':
    print_comic_titles()