python-geeks
diff --git a/‎watermark_removal/README.md‎
Lines changed: 15 additions & 0 deletions b/‎watermark_removal/README.md‎
Lines changed: 15 additions & 0 deletions
diff --git a/‎watermark_removal/requirements.txt‎
Lines changed: 4 additions & 0 deletions b/‎watermark_removal/requirements.txt‎
Lines changed: 4 additions & 0 deletions
diff --git a/‎watermark_removal/watermark_removal.py‎
Lines changed: 29 additions & 0 deletions b/‎watermark_removal/watermark_removal.py‎
Lines changed: 29 additions & 0 deletions
@@ -0,0 +1,15 @@
+# Script to remove watermarks from images and PDFs
+## How to use:
+1. Call the `watermark_removal` function with two arguments: the path to the folder containing the images whose watermarks are to be removed, and the output path (where you want to store the cleaned images). The script removes the watermarks from all jpg images in the folder and stores the results in a separate folder named "Cleaned".
+<br> example :-
+<br>```input_folder = "C:/User/Desktop"```
+<br>```output_folder = "C:/User/Desktop"```
+<br>```watermark_removal(input_folder, output_folder)```
+
+2. If you have a pdf with watermarks to be removed, first call the `pdf_to_jpg` function. It takes two arguments: the input folder (where your pdf is located) and the output folder (where the image of each page will be stored).
+<br> example :-
+<br>```input_folder = "C:/User/Desktop"```
+<br>```output_folder = "C:/User/Desktop"```
+<br>```pdf_to_jpg(input_folder, output_folder)```
+
+3. After calling the pdf function you can call the watermark_removal function to remove the watermarks from the pdf.
@@ -0,0 +1,4 @@
+opencv-python
+pdf2image
+# glob is part of the Python standard library and does not need to be installed
+numpy
@@ -0,0 +1,29 @@
+import numpy as np
+import glob
+import cv2
+from pdf2image import convert_from_path
+
+
def pdf_to_jpg(path_to_folder, output_path, dpi=500):
    """Render every page of every PDF in a folder to a JPEG image.

    Pages are written as ``image0000.jpg``, ``image0001.jpg``, ... inside
    ``output_path``. The page counter runs across all PDFs, so pages from a
    later PDF never overwrite pages from an earlier one.

    Args:
        path_to_folder: Folder searched (non-recursively) for ``*.pdf`` files.
        output_path: Folder that receives the page images; it is created
            if it does not exist yet.
        dpi: Rendering resolution handed to ``convert_from_path``.

    Returns:
        None. The function is used for its side effect of writing files.
    """
    import os

    os.makedirs(output_path, exist_ok=True)

    page_number = 0
    # glob returns files in arbitrary order; sorting keeps the page
    # numbering reproducible from run to run.
    for pdf in sorted(glob.glob(os.path.join(path_to_folder, "*.pdf"))):
        for page in convert_from_path(pdf, dpi):
            target = os.path.join(output_path, "image%04i.jpg" % page_number)
            page.save(target, 'JPEG')
            page_number += 1
+
+
def watermark_removal(path_to_folder, output_path, alpha=2.0, beta=-160):
    """Suppress light watermarks in every JPEG of a folder.

    Each image is converted to grayscale and passed through the linear
    transform ``alpha * pixel + beta``, clipped to the 0-255 range. With the
    default values, pixels darker than 80 become black and pixels brighter
    than about 207 become white, so light-gray marks are pushed to white.

    Results are written as ``image000.jpg``, ``image001.jpg``, ... into a
    ``Cleaned`` subfolder of ``output_path``.

    Args:
        path_to_folder: Folder searched (non-recursively) for ``*.jpg`` files.
        output_path: Folder under which the ``Cleaned`` subfolder is created.
        alpha: Contrast gain applied to each grayscale pixel.
        beta: Brightness offset added after the gain.

    Returns:
        None. The function is used for its side effect of writing files.

    Raises:
        OSError: If a cleaned image cannot be written.
    """
    import os
    import warnings

    # cv2.imwrite does not create missing folders; it just returns False,
    # so make sure the destination exists before writing anything.
    cleaned_dir = os.path.join(output_path, "Cleaned")
    os.makedirs(cleaned_dir, exist_ok=True)

    index = 0
    for image_path in sorted(glob.glob(os.path.join(path_to_folder, "*.jpg"))):
        original = cv2.imread(image_path)
        if original is None:
            # cv2.imread signals an unreadable file by returning None.
            warnings.warn("Skipping unreadable image: %s" % image_path)
            continue

        gray = cv2.cvtColor(original, cv2.COLOR_BGR2GRAY)
        # Work in float so an integer alpha cannot wrap around in uint8.
        stretched = alpha * gray.astype(np.float64) + beta
        cleaned = np.clip(stretched, 0, 255).astype(np.uint8)

        target = os.path.join(cleaned_dir, "image%03i.jpg" % index)
        if not cv2.imwrite(target, cleaned):
            raise OSError("Could not write cleaned image: %s" % target)
        index += 1
-Original file line number
+Diff line change
@@ @@ -0,0 +1,4 @@ @@
 +opencv-python
 +pdf2image
 +glob
 +numpy