summary refs log tree commit diff stats
diff options
context:
space:
mode:
author Anton Luka Šijanec <anton@sijanec.eu> 2023-02-19 20:13:13 +0100
committer Anton Luka Šijanec <anton@sijanec.eu> 2023-02-19 20:13:13 +0100
commit 78f50ab8b4bd57cd67d015fa2608bc86b116dfba (patch)
tree 4a4d943bffe0eeab63be12d7e91b1d79e60db591
parent rš cv (diff)
download r-78f50ab8b4bd57cd67d015fa2608bc86b116dfba.tar
r-78f50ab8b4bd57cd67d015fa2608bc86b116dfba.tar.gz
r-78f50ab8b4bd57cd67d015fa2608bc86b116dfba.tar.bz2
r-78f50ab8b4bd57cd67d015fa2608bc86b116dfba.tar.lz
r-78f50ab8b4bd57cd67d015fa2608bc86b116dfba.tar.xz
r-78f50ab8b4bd57cd67d015fa2608bc86b116dfba.tar.zst
r-78f50ab8b4bd57cd67d015fa2608bc86b116dfba.zip
-rwxr-xr-x skripti/4chan-thread-dl.py 12
1 files changed, 9 insertions, 3 deletions
diff --git a/skripti/4chan-thread-dl.py b/skripti/4chan-thread-dl.py
index 7a71df2..f1e2717 100755
--- a/skripti/4chan-thread-dl.py
+++ b/skripti/4chan-thread-dl.py
@@ -6,6 +6,12 @@ if len(argv) != 3:
raise Exception("prvi arg je url do threada, drugi arg je končnica, recimo .webm")
s = BeautifulSoup(get(argv[1]).content, "html.parser")
for a in s.find_all("a"):
- if a.attrs["href"].endswith(argv[2]) and "title" in a.attrs and "/" not in a.attrs["title"]:
- print(a.attrs["title"])
- open(a.attrs["title"], "wb").write(get("http:" + a.attrs["href"]).content)
+ if a.attrs["href"].endswith(argv[2]):
+ fn = None
+ if "title" in a.attrs and "/" not in a.attrs["title"]:
+ fn = a.attrs["title"]
+ elif "/" not in a.getText() and ("class" not in a.attrs or "fileThumb" not in a.attrs["class"]):
+ fn = a.getText()
+ if fn is not None:
+ print(fn)
+ open(fn, "wb").write(get("http:" + a.attrs["href"]).content)