[pillowfort] add 'user' and 'post' extractors (#846)

mikf · Jan 25, 2021 · 7ca3bf7 · 7ca3bf7
1 parent 477ed01
commit 7ca3bf7
Show file tree

Hide file tree

Showing 4 changed files with 133 additions and 2 deletions.
diff --git a/docs/supportedsites.rst b/docs/supportedsites.rst
@@ -100,6 +100,7 @@ Pawoo                https://pawoo.net/                  Images from Statuses, U
 Photobucket          https://photobucket.com/            Albums, individual Images
 PhotoVogue           https://www.vogue.it/en/photovogue/ User Profiles
 Piczel               https://piczel.tv/                  Folders, individual Images, User Profiles
+Pillowfort           https://www.pillowfort.social/      Posts, User Profiles
 Pinterest            https://www.pinterest.com/          |pinterest-C|                                      Supported
 Pixiv                https://www.pixiv.net/              |pixiv-C|                                          Required
 Pixnet               https://www.pixnet.net/             Folders, individual Images, Sets, User Profiles

diff --git a/gallery_dl/extractor/__init__.py b/gallery_dl/extractor/__init__.py
@@ -86,6 +86,7 @@
     "photobucket",
     "photovogue",
     "piczel",
+    "pillowfort",
     "pinterest",
     "pixiv",
     "pixnet",

diff --git a/gallery_dl/extractor/pillowfort.py b/gallery_dl/extractor/pillowfort.py
@@ -0,0 +1,129 @@
+# -*- coding: utf-8 -*-
+
+# Copyright 2021 Mike Fährmann
+#
+# This program is free software; you can redistribute it and/or modify
+# it under the terms of the GNU General Public License version 2 as
+# published by the Free Software Foundation.
+
+"""Extractors for https://www.pillowfort.social/"""
+
+from .common import Extractor, Message
+from .. import text
+
+BASE_PATTERN = r"(?:https?://)?www\.pillowfort\.social"
+
+
+class PillowfortExtractor(Extractor):
+    """Base class for pillowfort extractors"""
+    category = "pillowfort"
+    root = "https://www.pillowfort.social"
+    directory_fmt = ("{category}", "{username}")
+    filename_fmt = ("{post_id} {title|original_post[title]} "
+                    "{num:>02}.{extension}")
+    archive_fmt = "{id}"
+
+    def __init__(self, match):
+        Extractor.__init__(self, match)
+        self.item = match.group(1)
+
+    def items(self):
+        for post in self.posts():
+
+            files = post["media"]
+            del post["media"]
+
+            post["date"] = text.parse_datetime(
+                post["created_at"], "%Y-%m-%dT%H:%M:%S.%f%z")
+            yield Message.Directory, post
+
+            for post["num"], file in enumerate(files, 1):
+                url = file["url"]
+                post.update(file)
+                post["date"] = text.parse_datetime(
+                    file["created_at"], "%Y-%m-%dT%H:%M:%S.%f%z")
+                yield Message.Url, url, text.nameext_from_url(url, post)
+
+
+class PillowfortPostExtractor(PillowfortExtractor):
+    """Extractor for a single pillowfort post"""
+    subcategory = "post"
+    pattern = BASE_PATTERN + r"/posts/(\d+)"
+    test = ("https://www.pillowfort.social/posts/27510", {
+        "pattern": r"https://img\d+\.pillowfort\.social/posts/\w+_out\d+\.png",
+        "count": 4,
+        "keyword": {
+            "avatar_url": str,
+            "col": 0,
+            "commentable": True,
+            "comments_count": int,
+            "community_id": None,
+            "content": str,
+            "created_at": str,
+            "date": "type:datetime",
+            "deleted": None,
+            "deleted_at": None,
+            "deleted_by_mod": None,
+            "deleted_for_flag_id": None,
+            "embed_code": None,
+            "id": int,
+            "last_activity": str,
+            "last_activity_elapsed": str,
+            "last_edited_at": None,
+            "likes_count": int,
+            "media_type": "picture",
+            "nsfw": False,
+            "num": int,
+            "original_post_id": None,
+            "original_post_user_id": None,
+            "picture_content_type": None,
+            "picture_file_name": None,
+            "picture_file_size": None,
+            "picture_updated_at": None,
+            "post_id": 27510,
+            "post_type": "picture",
+            "privacy": "public",
+            "reblog_copy_info": list,
+            "rebloggable": True,
+            "reblogged_from_post_id": None,
+            "reblogged_from_user_id": None,
+            "reblogs_count": int,
+            "row": int,
+            "small_image_url": None,
+            "tags": list,
+            "time_elapsed": str,
+            "timestamp": str,
+            "title": "What is Pillowfort.io? ",
+            "updated_at": str,
+            "url": r"re:https://img3.pillowfort.social/posts/.*\.png",
+            "user_id": 5,
+            "username": "Staff"
+        },
+    })
+
+    def posts(self):
+        url = "{}/posts/{}/json/".format(self.root, self.item)
+        return (self.request(url).json(),)
+
+
+class PillowfortUserExtractor(PillowfortExtractor):
+    """Extractor for all posts of a pillowfort user"""
+    subcategory = "user"
+    pattern = BASE_PATTERN + r"/(?!posts/)([^/?#]+)"
+    test = ("https://www.pillowfort.social/Pome", {
+        "pattern": r"https://img\d+\.pillowfort\.social/posts/",
+        "range": "1-25",
+        "count": 25,
+    })
+
+    def posts(self):
+        url = "{}/{}/json/".format(self.root, self.item)
+        params = {"p": 1}
+
+        while True:
+            posts = self.request(url, params=params).json()["posts"]
+            yield from posts
+
+            if len(posts) < 20:
+                return
+            params["p"] += 1
diff --git a/gallery_dl/version.py b/gallery_dl/version.py
@@ -1,9 +1,9 @@
 # -*- coding: utf-8 -*-
 
-# Copyright 2016-2020 Mike Fährmann
+# Copyright 2016-2021 Mike Fährmann
 #
 # This program is free software; you can redistribute it and/or modify
 # it under the terms of the GNU General Public License version 2 as
 # published by the Free Software Foundation.
 
-__version__ = "1.16.4"
+__version__ = "1.16.5-dev"