Add files via upload

vivekthedev · web-flow · commit 38ec8133650e · 2022-01-23T12:32:46.000+05:30
diff --git a/GUIScripts/Slideshare to PDF/README.md b/GUIScripts/Slideshare to PDF/README.md
@@ -0,0 +1,45 @@
+# Slideshare to PDF
+
+## Aim
+
+The main aim of this script is to generate a PDF file from a SlideShare presentation link.
+
+## Purpose
+
+To download a presentation from SlideShare you normally have to sign up for Scribd, but with this script you can download any SlideShare presentation without signing up, provided that you have a good internet connection.
+
+## Short description of package/script
+
+The script uses the PIL (Pillow), requests, and BeautifulSoup modules to scrape the slide images from the presentation and then converts them into a PDF file.
+The success rate of the script depends on the speed of your internet connection, so for the best results try connecting to a good network.
+
+## Setup instructions
+
+To install the dependencies
+
+`pip install -r requirements.txt`
+
+To try the script
+
+`python main.py`
+
+- A GUI will open up, enter your link, press _Get PDF_
+- Wait until it shows that the file was downloaded successfully at the bottom of the GUI window.
+- After the success message, your file should be in the current working directory.
+
+## Output
+
+### Main Window:
+
+![](./Images/window.png)
+<br/>
+
+### Downloaded file:
+
+![](./Images/Output.png)
+
+## Author(s)
+
+[Vivek](https://github.com/vivekthedev)
+
+Questions? [Twitter](https://twitter.com/vivekthedev)
diff --git a/GUIScripts/Slideshare to PDF/main.py b/GUIScripts/Slideshare to PDF/main.py
@@ -0,0 +1,90 @@
+# Built in modules
+import io
+from tkinter import *
+import pathlib
+
+# External Modules
+import requests
+from bs4 import BeautifulSoup
+import PIL.Image
+import validators
+
+# Absolute path of the current working directory, resolved once at import time.
+# get_pdf() shows this path to the user in its success message.
+path = pathlib.Path().resolve()
+
+
+def get_pdf():
+    URL = url_var.get()
+
+    # Only perform scraping if the url is valid.
+    if validators.url(URL):
+        r = requests.get(URL)
+        soup = BeautifulSoup(r.content, "html5lib")
+        imgs = soup.find_all("img", class_="slide-image")
+
+        # Get every image with class slide-image
+        imgs = soup.find_all("img", class_="slide-image")
+
+        # Strip out preferred image resolution from the srcset of the img tag
+        imgSRC = [
+            x.get("srcset").split(",")[-1].strip().split(" ")[0].split("?")[0]
+            for x in imgs
+        ]
+
+        # List to store all the image objects
+        imagesJPG = []
+
+        for index, link in enumerate(imgSRC):
+            try:
+                # Get image content from the image url
+                im = requests.get(link)
+
+                # Convert that image content to a BytesIO file object which is in-memory object,
+                # so we don't have to download the image.
+                f = io.BytesIO(im.content)
+
+                # Converting that BytesIO object to Image Object for PIL to convert it in PDF
+                imgJPG = PIL.Image.open(f)
+                imagesJPG.append(imgJPG)
+
+            except Exception as e:
+                # Program will fail if the request isn't able to make a proper connection
+                info_label_2.configure(text="Some Connection ERROR")
+
+        # Appending all the images object after the first image and exporting it as a PDF in cwd.
+        imagesJPG[0].save(
+            f"{soup.title.string}.pdf", save_all=True, append_images=imagesJPG[1:]
+        )
+        info_label_2.configure(text=f"File Downloaded to\n{path}")
+    else:
+        info_label_2.configure(text=f"Please provide a valid link")
+
+
+# Basic Tkinter window setup
+base = Tk()
+base.geometry("300x300")
+base.title("Slideshare to PDF")
+base.resizable(False, False)
+base.configure(background="aliceblue")
+
+# Variable to store user's link and a  entry field,
+# a button and a label
+url_var = StringVar()
+val_entry = Entry(base, textvariable=url_var, width="30")
+val_entry.place(x=50, y=50)
+
+button = Button(
+    base, text="Get PDF", command=get_pdf, width="25", height="2", bg="grey"
+)
+button.place(x=50, y=100)
+info_label = Label(
+    base,
+    text="Enter the presentaion link\nMake sure to have a good internet connection.",
+)
+
+# label to show error and success message to the user
+info_label_2 = Label(base, text="")
+
+info_label.place(x=35, y=200)
+info_label_2.place(x=50, y=250)
+base.mainloop()
diff --git a/GUIScripts/Slideshare to PDF/requirements.txt b/GUIScripts/Slideshare to PDF/requirements.txt
@@ -0,0 +1,14 @@
+beautifulsoup4==4.10.0
+bs4==0.0.1
+certifi==2021.10.8
+charset-normalizer==2.0.10
+decorator==5.1.1
+html5lib==1.1
+idna==3.3
+Pillow==9.0.0
+requests==2.27.1
+six==1.16.0
+soupsieve==2.3.1
+urllib3==1.26.8
+validators==0.18.2
+webencodings==0.5.1