3 years ago · 92d8e75900
--- a/README.md
+++ b/README.md
@@ -4,4 +4,4 @@ This is a simple program to quickly install magazines etc. on [issuu.com](https:
 
															 ## Dependencies
														
 
															-This python script needs three non-standard python modules: termcolor, img2pdf and tqdm.
														
 
															+This Python script needs four non-standard Python modules: termcolor, img2pdf, tqdm and typer.
														
--- a/issuu-dl
+++ b/issuu-dl
@@ -1,20 +1,102 @@
 
															 #!/usr/bin/env python3
														
 
															 #
														
 
															-# issuu-dl v0.3
														
 
															+# issuu-dl v0.4
														
 
															 #
														
 
															 # download pdf from issuu.com
														
 
															 #
														
 
															-# tested (and working) on 04 Mar 2021
														
 
															+# tested (and working) on 05 Apr 2022
														
 
															-# arch-deps: python-tqdm, python-termcolor, img2pdf, python-validators
														
 
															+# arch-deps: python-requests, python-tqdm, python-termcolor, img2pdf, python-validators, python-typer
														
 
															+import typer
														
 
															 import requests
														
 
															 import sys
														
 
															 import json
														
 
															 import img2pdf
														
 
															 import os
														
 
															+import shutil
														
 
															 from termcolor import colored
														
 
															 from tqdm import tqdm
														
 
															+from enum import Enum
														
 
															+app = typer.Typer(add_completion=False)
														
 
															+
														
 
															+
														
 
															+class outType(str, Enum):
														
 
															+    pdf = 'pdf'
														
 
															+    cbz = 'cbz'
														
 
															+
														
 
															+@app.command(no_args_is_help=True)
														
 
															+def greeting(url: str= typer.Argument(..., help='Full issuu url'), output_file: outType = typer.Option('pdf', "--output-type", "-o", help='Whether output is a pdf or cbz.')):
														
 
															+
														
 
															+    doc = url.split('/')
														
 
															+    try:
														
 
															+        doc = doc[3] + '/' + doc[5]
														
 
															+    except IndexError:
														
 
															+        errorMsg()
														
 
															+    print(doc)
														
 
															+    print("[*] doc is '{}'".format(colored(doc, 'yellow')))
														
 
															+    outfile_prefix = doc.replace('/', '_')
														
 
															+    outfile = outfile_prefix + "." + output_file
														
 
															+    pid = str(os.getpid())
														
 
															+
														
 
															+    print("[*] opening page...")
														
 
															+    s = requests.Session()
														
 
															+
														
 
															+    try:
														
 
															+        r = s.get(url)
														
 
															+    except requests.exceptions.TooManyRedirects:
														
 
															+        errorMsg()
														
 
															+    try:
														
 
															+        assert r.status_code == 200
														
 
															+    except AssertionError:
														
 
															+        errorMsg()
														
 
															+    print(colored("[+] url confirmed", "green"))
														
 
															+    assert 'issuu-reader3-embed-files' in r.content.decode()
														
 
															+    print(colored("[+] reader3 support confirmed", "green"))
														
 
															+
														
 
															+    print("[*] downloading reader3_4.json...")
														
 
															+
														
 
															+    r = s.get("https://reader3.isu.pub/{}/reader3_4.json".format(doc))
														
 
															+    j = json.loads(r.content.decode())
														
 
															+
														
 
															+    pubId = j["document"]["publicationId"]
														
 
															+    revId = j["document"]["revisionId"]
														
 
															+    pages = j["document"]["pages"]
														
 
															+
														
 
															+    print(colored("[+] fetched document data: ", "green") + colored("publicationId is {}, revisionId is {}".format(pubId, revId), "yellow"))
														
 
															+    print(colored("[+] found {} pages".format(len(pages)), "green"))
														
 
															+
														
 
															+    print("[*] downloading pages...")
														
 
															+
														
 
															+    filenames = []
														
 
															+    directoryName = pid+"_"+outfile_prefix
														
 
															+    os.mkdir(directoryName)
														
 
															+    for page in tqdm(pages):
														
 
															+        i = page["imageUri"].split('/')
														
 
															+        f = os.path.join(directoryName, i[1]+"-"+i[3])
														
 
															+        r = s.get("https://"+page["imageUri"])
														
 
															+        open(f, "wb").write(r.content)
														
 
															+        filenames.append(f)
														
 
															+
														
 
															+    print(colored("[+] downloaded {} jpg files".format(len(pages), "green")))
														
 
															+
														
 
															+    if output_file == "pdf":
														
 
															+        print("[*] converting to single pdf...")
														
 
															+        with open(outfile, "wb") as out:
														
 
															+            out.write(img2pdf.convert(filenames))
														
 
															+
														
 
															+        print(colored("[+] output pdf '{}' is ready".format(colored(outfile, "yellow")), "green"))
														
 
															+    else:
														
 
															+        print("[*] converting to single cbz...")
														
 
															+        shutil.make_archive(outfile, 'zip', directoryName)
														
 
															+        os.rename(outfile+".zip", outfile)
														
 
															+        print(colored("[+] output cbz '{}' is ready".format(colored(outfile, "yellow")), "green"))
														
 
															+
														
 
															+    print("[*] cleaning up jpg files...")
														
 
															+    for f in filenames:
														
 
															+        os.remove(f)
														
 
															+    os.rmdir(directoryName)
														
 
															+
														
 
															 def usage():
														
 
															     print("USAGE: issuu-dl [full issuu url of target document]")
														
@@ -24,67 +106,8 @@ def errorMsg():
 
															     print("Error: wrong URL format, please recheck your link")
														
 
															     exit()
														
 
															-try:
														
 
															-    url = sys.argv[1]
														
 
															-except:
														
 
															-    usage()
														
 
															-
														
 
															-doc = url.split('/')
														
 
															-try:
														
 
															-    doc = doc[3] + '/' + doc[5]
														
 
															-except IndexError:
														
 
															-    errorMsg()
														
 
															-print(doc)
														
 
															-print("[*] doc is '{}'".format(colored(doc, 'yellow')))
														
 
															-outfile = doc.replace('/', '_') + ".pdf"
														
 
															-
														
 
															-print("[*] opening page...")
														
 
															-s = requests.Session()
														
 
															-
														
 
															-try:
														
 
															-    r = s.get(url)
														
 
															-except requests.exceptions.TooManyRedirects:
														
 
															-    errorMsg()
														
 
															-try:
														
 
															-    assert r.status_code == 200
														
 
															-except AssertionError:
														
 
															-    errorMsg()
														
 
															-print(colored("[+] url confirmed", "green"))
														
 
															-assert 'issuu-reader3-embed-files' in r.content.decode()
														
 
															-print(colored("[+] reader3 support confirmed", "green"))
														
 
															-
														
 
															-print("[*] downloading reader3_4.json...")
														
 
															-
														
 
															-r = s.get("https://reader3.isu.pub/{}/reader3_4.json".format(doc))
														
 
															-j = json.loads(r.content.decode())
														
 
															-
														
 
															-pubId = j["document"]["publicationId"]
														
 
															-revId = j["document"]["revisionId"]
														
 
															-pages = j["document"]["pages"]
														
 
															-
														
 
															-print(colored("[+] fetched document data: ", "green") + colored("publicationId is {}, revisionId is {}".format(pubId, revId), "yellow"))
														
 
															-print(colored("[+] found {} pages".format(len(pages)), "green"))
														
 
															-
														
 
															-print("[*] downloading pages...")
														
 
															-
														
 
															-filenames = []
														
 
															-for page in tqdm(pages):
														
 
															-    i = page["imageUri"].split('/')
														
 
															-    f = i[1]+"-"+i[3]
														
 
															-    r = s.get("https://"+page["imageUri"])
														
 
															-    open(f, "wb").write(r.content)
														
 
															-    filenames.append(f)
														
 
															-
														
 
															-print(colored("[+] downloaded {} jpg files".format(len(pages), "green")))
														
 
															-
														
 
															-print("[*] converting to single pdf...")
														
 
															-with open(outfile, "wb") as out:
														
 
															-    out.write(img2pdf.convert(filenames))
														
 
															-
														
 
															-print(colored("[+] output pdf '{}' is ready".format(colored(outfile, "yellow")), "green"))
														
 
															-
														
 
															-print("[*] cleaning up jpg files...")
														
 
															-for f in filenames:
														
 
															-    os.remove(f)
														
 
															-
														
 
															-print(colored("[+] done.", "green"))
														
 
															+
														
 
															+
														
 
															+
														
 
															+if __name__ == '__main__':
														
 
															+    app()