summaryrefslogtreecommitdiffstats
path: root/gallery_dl/extractor/chan.py
diff options
context:
space:
mode:
Diffstat (limited to 'gallery_dl/extractor/chan.py')
-rw-r--r--gallery_dl/extractor/chan.py61
1 files changed, 61 insertions, 0 deletions
diff --git a/gallery_dl/extractor/chan.py b/gallery_dl/extractor/chan.py
new file mode 100644
index 0000000..5e44fd9
--- /dev/null
+++ b/gallery_dl/extractor/chan.py
@@ -0,0 +1,61 @@
+# -*- coding: utf-8 -*-
+
+# Copyright 2015-2019 Mike Fährmann
+#
+# This program is free software; you can redistribute it and/or modify
+# it under the terms of the GNU General Public License version 2 as
+# published by the Free Software Foundation.
+
+"""Base classes for extractors for different Futaba Channel-like boards"""
+
+from .common import Extractor, Message
+from .. import text
+
+
+class ChanThreadExtractor(Extractor):
+ """Base class for extractors for Futaba Channel-like boards"""
+ category = "chan"
+ subcategory = "thread"
+ directory_fmt = ("{category}", "{board}", "{thread} - {title}")
+ filename_fmt = "{tim}-{filename}.{extension}"
+ archive_fmt = "{board}_{thread}_{tim}"
+ api_url = ""
+ file_url = ""
+
+ def __init__(self, match):
+ Extractor.__init__(self, match)
+ self.metadata = {
+ "board": match.group(1),
+ "thread": match.group(2),
+ }
+
+ def items(self):
+ yield Message.Version, 1
+ url = self.api_url.format_map(self.metadata)
+ posts = self.request(url).json()["posts"]
+ self.metadata["title"] = self.get_thread_title(posts[0])
+ yield Message.Directory, self.metadata
+ for post in posts:
+ if "filename" not in post:
+ continue
+ self.update(post)
+ yield Message.Url, self.build_url(post), post
+ if "extra_files" in post:
+ for file in post["extra_files"]:
+ self.update(post, file)
+ yield Message.Url, self.build_url(post), post
+
+ def update(self, post, data=None):
+ """Update keyword dictionary"""
+ post.update(data or self.metadata)
+ post["extension"] = post["ext"][1:]
+
+ def build_url(self, post):
+ """Construct an image url out of a post object"""
+ return self.file_url.format_map(post)
+
+ @staticmethod
+ def get_thread_title(post):
+ """Return thread title from first post"""
+ title = post["sub"] if "sub" in post else text.remove_html(post["com"])
+ return text.unescape(title)[:50]