From b8df76cfbffbb252fd653021782b536bcf80467b Mon Sep 17 00:00:00 2001
From: Joakim Holm <mail@joakimholm.xyz>
Date: Tue, 9 Jan 2024 14:44:39 +0100
Subject: [PATCH] Add DC Universe Infinte Source

---
 README.md                               |   1 +
 grawlix/__main__.py                     |  25 +++-
 grawlix/assets/errors/access_denied.txt |   3 +
 grawlix/book.py                         |   2 +
 grawlix/exceptions.py                   |   3 +
 grawlix/sources/__init__.py             |   2 +
 grawlix/sources/dcuniverseinfinite.py   | 169 ++++++++++++++++++++++++
 7 files changed, 199 insertions(+), 6 deletions(-)
 create mode 100644 grawlix/assets/errors/access_denied.txt
 create mode 100644 grawlix/sources/dcuniverseinfinite.py

diff --git a/README.md b/README.md
index 4bb3acc..db78853 100644
--- a/README.md
+++ b/README.md
@@ -8,6 +8,7 @@ CLI ebook downloader
 
 ## Supported services
 grawlix currently supports downloading from the following sources:
+- [DC Universe Infinite](https://www.dcuniverseinfinite.com)
 - [eReolen](https://ereolen.dk)
 - [fanfiction.net](https://www.fanfiction.net)
 - [Flipp](https://flipp.dk)
diff --git a/grawlix/__main__.py b/grawlix/__main__.py
index 139dcf0..5b9bf6c 100644
--- a/grawlix/__main__.py
+++ b/grawlix/__main__.py
@@ -1,6 +1,6 @@
 from .book import Book, Series
 from .config import load_config, Config, SourceConfig
-from .exceptions import SourceNotAuthenticated, GrawlixError
+from .exceptions import SourceNotAuthenticated, GrawlixError, AccessDenied
 from .sources import load_source, Source
 from .output import download_book
 from . import  arguments, logging
@@ -105,11 +105,7 @@ async def main() -> None:
                     template: str = args.output or "{title}.{ext}"
                     await download_with_progress(result, progress, template)
             elif isinstance(result, Series):
-                template = args.output or "{series}/{title}.{ext}"
-                with logging.progress(result.title, source.name, len(result.book_ids)) as progress:
-                    for book_id in result.book_ids:
-                        book: Book = await source.download_book_from_id(book_id)
-                        await download_with_progress(book, progress, template)
+                await download_series(source, result, args)
             logging.info("")
         except GrawlixError as error:
             error.print_error()
@@ -118,6 +114,23 @@ async def main() -> None:
             exit(1)
 
 
+async def download_series(source: Source, series: Series, args) -> None:
+    """
+    Download books in series
+
+    :param series: Series to download
+    """
+    template = args.output or "{series}/{title}.{ext}"
+    with logging.progress(series.title, source.name, len(series.book_ids)) as progress:
+        for book_id in series.book_ids:
+            try:
+                book: Book = await source.download_book_from_id(book_id)
+                await download_with_progress(book, progress, template)
+            except AccessDenied as error:
+                logging.info("Skipping - Access Denied")
+
+
+
 async def download_with_progress(book: Book, progress: Progress, template: str):
     """
     Download book with progress bar in cli
diff --git a/grawlix/assets/errors/access_denied.txt b/grawlix/assets/errors/access_denied.txt
new file mode 100644
index 0000000..f2a1be8
--- /dev/null
+++ b/grawlix/assets/errors/access_denied.txt
@@ -0,0 +1,3 @@
+[red]ERROR: Access denied[/red]
+
+You do not have access to the book you are trying to download.
diff --git a/grawlix/book.py b/grawlix/book.py
index 7de10ef..6fac2ab 100644
--- a/grawlix/book.py
+++ b/grawlix/book.py
@@ -8,6 +8,7 @@ class Metadata:
     """Metadata about a book"""
     title: str
     series: Optional[str] = None
+    index: Optional[int] = None
     authors: list[str] = field(default_factory=list)
     language: Optional[str] = None
     publisher: Optional[str] = None
@@ -19,6 +20,7 @@ class Metadata:
         return {
             "title": self.title,
             "series": self.series or "UNKNOWN",
+            "index": self.index or "UNKNOWN",
             "publisher": self.publisher or "UNKNOWN",
             "identifier": self.identifier or "UNKNOWN",
             "language": self.language or "UNKNOWN",
diff --git a/grawlix/exceptions.py b/grawlix/exceptions.py
index 1832740..aeea79b 100644
--- a/grawlix/exceptions.py
+++ b/grawlix/exceptions.py
@@ -28,3 +28,6 @@ class SourceNotAuthenticated(GrawlixError):
 
 class ThrottleError(GrawlixError):
     error_file = "throttle"
+
+class AccessDenied(GrawlixError):
+    error_file = "access_denied"
diff --git a/grawlix/sources/__init__.py b/grawlix/sources/__init__.py
index 94adfd0..cab6155 100644
--- a/grawlix/sources/__init__.py
+++ b/grawlix/sources/__init__.py
@@ -1,6 +1,7 @@
 from grawlix.exceptions import InvalidUrl
 
 from .source import Source
+from .dcuniverseinfinite import DcUniverseInfinite
 from .ereolen import Ereolen
 from .fanfictionnet import FanfictionNet
 from .flipp import Flipp
@@ -55,6 +56,7 @@ def get_source_classes() -> list[type[Source]]:
     :returns: A list of all available source types
     """
     return [
+        DcUniverseInfinite,
         Ereolen,
         FanfictionNet,
         Flipp,
diff --git a/grawlix/sources/dcuniverseinfinite.py b/grawlix/sources/dcuniverseinfinite.py
new file mode 100644
index 0000000..9831dbd
--- /dev/null
+++ b/grawlix/sources/dcuniverseinfinite.py
@@ -0,0 +1,169 @@
+from grawlix import logging
+from grawlix.book import Result, Book, Metadata, OnlineFile, ImageList, Series
+from grawlix.encryption import Encryption
+from grawlix.exceptions import InvalidUrl, AccessDenied
+from .source import Source
+
+import re
+from typing import Tuple, List
+from hashlib import sha256
+from Crypto.Cipher import AES
+
+class DcUniverseInfinite(Source):
+    name = "DC Universe Infinite"
+    match: list[str] = [
+        # Reader page
+        r"https://www.dcuniverseinfinite.com/comics/book/[^/]+/[^/]+/c/reader",
+        # Issue info page
+        r"https://www.dcuniverseinfinite.com/comics/book/[^/]+/[^/]+/c",
+        # Series info page
+        r"https://www.dcuniverseinfinite.com/comics/series/[^/]+/[^/]+"
+    ]
+    _authentication_methods = [ "cookies" ]
+
+
+    async def download(self, url: str) -> Result:
+        # Set headers
+        auth_token = self._client.cookies.get("session")
+        self._client.headers.update({
+            "Authorization": f"Token {auth_token}",
+            "X-Consumer-Key": await self.download_consumer_secret()
+        })
+        self.plan = await self.download_plan()
+        logging.debug(f"{self.plan=}")
+        # Download book
+        typ, id = self.extract_id_from_url(url)
+        if typ == "book":
+            logging.debug(f"Book id: {id}")
+            return await self.download_book_from_id(id)
+        else:
+            logging.debug(f"Series id: {id}")
+            return await self.download_series(id)
+
+
+    async def download_series(self, series_id: str) -> Series[str]:
+        # TODO Check for ultra releases
+        response = await self._client.get(
+            f"https://www.dcuniverseinfinite.com/api/comics/1/series/{series_id}/?trans=en"
+        )
+        content = response.json()
+        return Series(
+            title = content["title"],
+            book_ids = [x for x in content["book_uuids"]["issue"]]
+        )
+
+
+    async def download_book_from_id(self, book_id: str) -> Book:
+        return Book(
+            data = await self.download_pages(book_id),
+            metadata = await self.download_book_metadata(book_id)
+        )
+
+
+    async def download_pages(self, book_id: str) -> ImageList:
+        """
+        Download comic pages
+
+        :param book_id: Id of comic
+        :return: List of comic pages
+        """
+        response = await self._client.get(
+            f"https://www.dcuniverseinfinite.com/api/5/1/rights/comic/{book_id}?trans=en"
+        )
+        jwt = response.json()
+        response = await self._client.get(
+            "https://www.dcuniverseinfinite.com/api/comics/1/book/download/?page=1&quality=HD&trans=en",
+            headers = {
+                "X-Auth-JWT": jwt
+            }
+        )
+        response = response.json()
+        if not "uuid" in response:
+            raise AccessDenied
+        uuid = response["uuid"]
+        job_id = response["job_id"]
+        format_id = response["format"]
+        images: List[OnlineFile] = []
+        for page in response["images"]:
+            page_number = page["page_number"]
+            images.append(OnlineFile(
+                url = page["signed_url"],
+                extension = "jpg",
+                encryption = DcUniverseInfinteEncryption(uuid, page_number, job_id, format_id)
+            ))
+        return ImageList(images)
+
+
+    async def download_book_metadata(self, book_id: str) -> Metadata:
+        """
+        Download book metadata
+
+        :param book_id: Id of book
+        :return: Book metadata
+        """
+        response = await self._client.get(
+            f"https://www.dcuniverseinfinite.com/api/comics/1/book/{book_id}/?trans=en"
+        )
+        content = response.json()
+        return Metadata(
+            title = content["title"],
+            series = content["series_title"],
+            index = int(content["issue_number"]),
+            publisher = "DC"
+        )
+
+
+    def extract_id_from_url(self, url: str) -> Tuple[str, str]:
+        """
+        Extract book or series id from url
+
+        :param url: Url of page with id
+        :return: Type (book or series) and id
+        """
+        match_index = self.get_match_index(url)
+        if match_index == 0:
+            book_id = url.split("/")[-3]
+            return ("book", book_id)
+        if match_index == 1:
+            book_id = url.split("/")[-2]
+            return ("book", book_id)
+        if match_index == 2:
+            series_id = url.split("/")[-1]
+            return ("series", series_id)
+        raise InvalidUrl
+
+
+    async def download_consumer_secret(self) -> str:
+        """Download consumer secret"""
+        response = await self._client.get(
+            "https://www.dcuniverseinfinite.com/api/5/consumer/www?trans=en"
+        )
+        return response.json()["consumer_secret"]
+
+
+    async def download_plan(self) -> str:
+        """Download user subscribtion plan"""
+        response = await self._client.get(
+            "https://www.dcuniverseinfinite.com/api/claims/?trans=en"
+        )
+        return response.json()["data"]["urn:df:clm:premium"]["plan"]
+
+
+class DcUniverseInfinteEncryption:
+    key: bytes
+
+    def __init__(self, uuid: str, page_number: int, job_id: str, format_id: str):
+        string_key = f"{uuid}{page_number}{job_id}{format_id}"
+        self.key = sha256(string_key.encode("utf8")).digest()
+
+
+    def decrypt(self, data: bytes) -> bytes:
+        # The first 8 bytes contains the size of the output file
+        original_size = int.from_bytes(data[0:8], byteorder="little")
+        # The next 16 bytes are the initialization vector
+        iv = data[8:24]
+        # The rest of the data is the encrypted image
+        encrypted_image = data[24:]
+        # Decrypting image
+        cipher = AES.new(self.key, AES.MODE_CBC, iv)
+        return cipher.decrypt(encrypted_image)