1 files changed, 183 insertions, 0 deletions
diff --git a/gallery_dl/extractor/imgur.py b/gallery_dl/extractor/imgur.py
new file mode 100644
index 0000000..0468c0b
--- /dev/null
+++ b/gallery_dl/extractor/imgur.py
@@ -0,0 +1,183 @@
+# -*- coding: utf-8 -*-
+
+# Copyright 2015-2019 Mike Fährmann
+#
+# This program is free software; you can redistribute it and/or modify
+# it under the terms of the GNU General Public License version 2 as
+# published by the Free Software Foundation.
+
+"""Extract images from https://imgur.com/"""
+
+from .common import Extractor, Message
+from .. import text, exception
+import json
+
+
+class ImgurExtractor(Extractor):
+    """Base class for imgur extractors"""
+    category = "imgur"
+
+    def __init__(self, match):
+        Extractor.__init__(self, match)
+        self.item_id = match.group(1)
+        self.mp4 = self.config("mp4", True)
+
+    def _get_data(self, urlpart):
+        response = self.request("https://imgur.com/" + urlpart, expect=(404,))
+        if response.status_code == 404:
+            raise exception.NotFoundError(self.subcategory)
+        data = text.extract(response.text, "image               : ", ",\n")[0]
+        return self._clean(json.loads(data))
+
+    def _prepare(self, image):
+        image["ext"] = image["ext"].partition("?")[0]
+        if image["ext"] == ".gif" and (
+                (self.mp4 and image["prefer_video"]) or self.mp4 == "always"):
+            image["ext"] = ".mp4"
+        url = "https://i.imgur.com/" + image["hash"] + image["ext"]
+        image["extension"] = image["ext"][1:]
+        return url
+
+    @staticmethod
+    def _clean(data):
+        try:
+            del data["adConfig"]
+            del data["isAd"]
+        except KeyError:
+            pass
+        return data
+
+
+class ImgurImageExtractor(ImgurExtractor):
+    """Extractor for individual images from imgur.com"""
+    subcategory = "image"
+    filename_fmt = "{category}_{hash}{title:?_//}.{extension}"
+    archive_fmt = "{hash}"
+    pattern = (r"(?:https?://)?(?:www\.|[im]\.|)?imgur\.com"
+               r"/(?!gallery)(\w{7}|\w{5})[sbtmlh]?\.?")
+    test = (
+        ("https://imgur.com/21yMxCS", {
+            "url": "6f2dcfb86815bdd72808c313e5f715610bc7b9b2",
+            "content": "0c8768055e4e20e7c7259608b67799171b691140",
+            "keyword": {
+                "animated": False,
+                "datetime": "2016-11-10 14:24:35",
+                "description": str,
+                "ext": ".png",
+                "extension": "png",
+                "hash": "21yMxCS",
+                "height": "32",
+                "is_moderated": False,
+                "is_safe": False,
+                "is_viral": 0,
+                "looping": False,
+                "mimetype": "image/png",
+                "name": None,
+                "prefer_video": False,
+                "size": 182,
+                "source": "",
+                "title": "Test",
+                "video_host": None,
+                "video_source": None,
+                "width": "64",
+            },
+        }),
+        ("http://imgur.com/0gybAXR", {  # gifv/mp4 video
+            "url": "a2220eb265a55b0c95e0d3d721ec7665460e3fd7",
+            "content": "a3c080e43f58f55243ab830569ba02309d59abfc",
+        }),
+        ("https://imgur.com/HjoXJAd", {  # url ends with '.jpg?1'
+            "url": "73f361b50753ab25da64160aa50bc5d139480d45",
+        }),
+        ("https://imgur.com/zzzzzzz", {  # not found
+            "exception": exception.NotFoundError,
+        }),
+        ("https://www.imgur.com/21yMxCS"),  # www
+        ("https://m.imgur.com/21yMxCS"),  # mobile
+        ("https://imgur.com/zxaY6"),  # 5 character key
+        ("https://i.imgur.com/21yMxCS.png"),  # direct link
+        ("https://i.imgur.com/21yMxCSh.png"),  # direct link thumbnail
+        ("https://i.imgur.com/zxaY6.gif"),  # direct link (short)
+        ("https://i.imgur.com/zxaY6s.gif"),  # direct link (short; thumb)
+    )
+
+    def items(self):
+        image = self._get_data(self.item_id)
+        url = self._prepare(image)
+
+        yield Message.Version, 1
+        yield Message.Directory, image
+        yield Message.Url, url, image
+
+
+class ImgurAlbumExtractor(ImgurExtractor):
+    """Extractor for image albums from imgur.com"""
+    subcategory = "album"
+    directory_fmt = ("{category}", "{album[hash]}{album[title]:? - //}")
+    filename_fmt = "{category}_{album[hash]}_{num:>03}_{hash}.{extension}"
+    archive_fmt = "{album[hash]}_{hash}"
+    pattern = (r"(?:https?://)?(?:www\.|m\.)?imgur\.com"
+               r"/(?:a|gallery|t/unmuted)/(\w{7}|\w{5})")
+    test = (
+        ("https://imgur.com/a/TcBmP", {
+            "url": "ce3552f550a5b5316bd9c7ae02e21e39f30c0563",
+            "keyword": {
+                "album": {
+                    "album_cover": "693j2Kr",
+                    "album_description": None,
+                    "cover": "693j2Kr",
+                    "datetime": "2015-10-09 10:37:50",
+                    "description": None,
+                    "hash": "TcBmP",
+                    "id": "TcBmP",
+                    "is_album": True,
+                    "num_images": "19",
+                    "title": "138",
+                    "title_clean": "TcBmP",
+                    "views": str,
+                },
+                "animated": bool,
+                "datetime": str,
+                "extension": str,
+                "hash": str,
+                "height": int,
+                "num": int,
+                "prefer_video": bool,
+                "size": int,
+                "title": str,
+                "width": int,
+            },
+        }),
+        ("https://imgur.com/gallery/eD9CT", {  # large album
+            "url": "4ee94de31ff26be416271bc0b1ea27b9349c9937",
+        }),
+        ("https://imgur.com/a/RhJXhVT/all", {  # 7 character album hash
+            "url": "695ef0c950023362a0163ee5041796300db76674",
+        }),
+        ("https://imgur.com/t/unmuted/YMqBcua", {  # unmuted URL
+            "url": "86b4747f8147cec7602f0214e267309af73a8655",
+        }),
+        ("https://imgur.com/a/TcBmQ", {
+            "exception": exception.NotFoundError,
+        }),
+        ("https://www.imgur.com/a/TcBmP"),  # www
+        ("https://m.imgur.com/a/TcBmP"),  # mobile
+    )
+
+    def items(self):
+        album = self._get_data("a/" + self.item_id + "/all")
+        images = album["album_images"]["images"]
+        del album["album_images"]
+
+        if int(album["num_images"]) > len(images):
+            url = ("https://imgur.com/ajaxalbums/getimages/" +
+                   self.item_id + "/hit.json")
+            images = self.request(url).json()["data"]["images"]
+
+        yield Message.Version, 1
+        yield Message.Directory, {"album": album, "count": len(images)}
+        for num, image in enumerate(images, 1):
+            url = self._prepare(image)
+            image["num"] = num
+            image["album"] = album
+            yield Message.Url, url, image