Spaces:
Sleeping
Sleeping
File size: 1,023 Bytes
02d5bc7 9d554d5 02d5bc7 |
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 |
import subprocess
import os
import shutil
def rename_and_move_files(root_folder):
    """Flatten Markdown files under ``root_folder`` into ``*_PDF_FILE.txt`` files.

    Walks ``root_folder`` recursively. Every file whose name ends in ``.md``
    is moved directly into ``root_folder`` with the trailing ``.md`` replaced
    by ``_PDF_FILE.txt``. Once all Markdown files of a sub-folder have been
    moved, that sub-folder is deleted together with everything left in it.

    Args:
        root_folder: Directory to scan; also the destination of the renamed
            files. It is never deleted itself.

    Raises:
        OSError: If a rename or a folder removal fails.
    """
    suffix = '.md'
    root_abs = os.path.abspath(root_folder)
    for foldername, subfolders, filenames in os.walk(root_folder):
        moved_any = False
        for filename in filenames:
            if not filename.endswith(suffix):
                continue
            # Strip only the trailing extension; str.replace would also
            # rewrite any ".md" occurring in the middle of the name.
            stem = filename[:-len(suffix)]
            source_path = os.path.join(foldername, filename)
            dest_path = os.path.join(root_folder, stem + '_PDF_FILE.txt')
            os.rename(source_path, dest_path)
            moved_any = True

        # Remove the folder only after *all* of its Markdown files have been
        # moved, and never remove the destination root (that would delete the
        # files that were just placed there).
        if moved_any and os.path.abspath(foldername) != root_abs:
            # The whole subtree is about to disappear: stop os.walk from
            # trying to descend into it.
            subfolders[:] = []
            shutil.rmtree(foldername)
def process_pdf_performance(path):
    """Run ``marker_single`` on every PDF under ``path`` and collect the text.

    Creates ``<path>/extracted_pdf/``, walks ``path`` recursively, and invokes
    the ``marker_single`` command once per file whose name ends in ``.pdf``,
    passing the PDF path, the output directory and ``--batch_multiplier 10``.
    Afterwards ``rename_and_move_files`` is called on the output directory.

    Args:
        path: Directory to search for PDF files.
    """
    path_extracted_pdf = path + "/extracted_pdf/"
    os.makedirs(path_extracted_pdf, exist_ok=True)

    for root, dirs, files in os.walk(path):
        for file in files:
            if not file.endswith('.pdf'):
                continue
            pdf_path = os.path.join(root, file)
            print("FILE IS ", pdf_path)
            # Pass arguments as a list (no shell): spaces, quotes or other
            # shell metacharacters anywhere in the path reach the tool
            # verbatim instead of being word-split or interpreted.
            command = [
                "marker_single",
                pdf_path,
                path_extracted_pdf,
                "--batch_multiplier",
                "10",
            ]
            try:
                result = subprocess.run(command, check=False)
            except OSError as exc:
                # Best-effort, like the previous os.system call: a tool that
                # cannot be started must not abort the rest of the batch.
                print("COULD NOT RUN marker_single:", exc)
                continue
            if result.returncode != 0:
                print("marker_single FAILED FOR ", pdf_path,
                      " EXIT CODE ", result.returncode)

    # NOTE(review): presumably marker_single writes each result as a .md file
    # in its own sub-folder of the output directory — confirm against the
    # tool's output layout.
    rename_and_move_files(path_extracted_pdf)
|