# Final_Code_for_Markup
###FINAL
import fitz # PyMuPDF
from PyPDF2 import PdfReader, PdfWriter
import csv
import pandas as pd
def read_search_texts_from_csv(csv_path):
    """Return the first-column value of every non-empty row in a CSV file.

    Args:
        csv_path: Path of the CSV file to read. Only the first field of
            each row is used; any further columns are ignored.

    Returns:
        A list of strings, one per non-empty row, in file order. An empty
        file yields an empty list.
    """
    # newline="" lets the csv module do its own newline handling, so quoted
    # fields that contain line breaks are parsed correctly.
    with open(csv_path, "r", newline="") as csvfile:
        reader = csv.reader(csvfile)
        # csv.reader yields [] for blank lines; skip those rather than
        # failing with IndexError on row[0].
        return [row[0] for row in reader if row]
if __name__ == "__main__":
    # Script entry point: for every file name listed in the first column of
    # an Excel sheet, run my_search_and_highlight on the matching input PDF
    # and write the result under the same name in the output directory.
    import os  # local import: only this entry point needs path joining

    # Replace these variables with your actual file paths and search texts
    input_pdf_loc = "/Users/sureshkadam/Documents/MY DATA/PYHTON-WINDOWS/PYTHON/HTMLPARSER/Htmlparser/ETPDF/"
    output_pdf_loc = "/Users/sureshkadam/Documents/MY DATA/PHD/DATA/MARKUP_PDF/"
    csv_path = "search_texts.csv"
    excel_file_path = "/Users/sureshkadam/Documents/MY DATA/PHD/DATA/MARKUP_PDF/filestoupdate.xlsx"

    # The search terms were never loaded before being used below; read them
    # from the CSV named by csv_path.
    search_texts = read_search_texts_from_csv(csv_path)

    df = pd.read_excel(excel_file_path)
    # First column holds the file names; drop blank cells (NaN), which
    # cannot be joined onto a directory path.
    filenames = df.iloc[:, 0].dropna()

    for i, values in enumerate(filenames, start=1):
        input_pdf_path = os.path.join(input_pdf_loc, values)
        output_pdf_path = os.path.join(output_pdf_loc, values)
        # NOTE(review): my_search_and_highlight is not defined in the visible
        # part of this file -- presumably defined elsewhere; confirm.
        my_search_and_highlight(input_pdf_path, search_texts, output_pdf_path)
        # Progress line: running count and the file just processed.
        print(f"{i} - {values}")