File size: 1,023 Bytes
02d5bc7
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
9d554d5
 
 
 
 
 
02d5bc7
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
import subprocess
import os

import shutil
def rename_and_move_files(root_folder):
    """Flatten every ``.md`` file under *root_folder* into *root_folder* itself.

    Each ``<name>.md`` found anywhere below *root_folder* is moved to
    ``<root_folder>/<name>_PDF_FILE.txt``. Every sub-folder that directly
    contained at least one ``.md`` file is then deleted together with its
    remaining contents. *root_folder* itself is never deleted.

    Args:
        root_folder: Directory to scan and to move the renamed files into.

    Raises:
        OSError: If a move or a directory removal fails.
    """
    suffix = '.md'
    root_abs = os.path.abspath(root_folder)
    folders_to_remove = []

    # Snapshot the tree first: moving and deleting while os.walk is still
    # lazily scanning would make it skip (or fail on) vanished directories.
    for foldername, _subfolders, filenames in list(os.walk(root_folder)):
        md_files = [name for name in filenames if name.endswith(suffix)]
        if not md_files:
            continue

        for filename in md_files:
            source_path = os.path.join(foldername, filename)
            # Strip only the trailing extension; str.replace would also
            # rewrite a '.md' occurring in the middle of the name.
            new_name = filename[:-len(suffix)] + '_PDF_FILE.txt'
            dest_path = os.path.join(root_folder, new_name)
            os.rename(source_path, dest_path)

        # Never schedule the destination folder itself for deletion,
        # otherwise the files that were just moved would be destroyed.
        if os.path.abspath(foldername) != root_abs:
            folders_to_remove.append(foldername)

    # Delete only after every file has been moved, so a folder holding
    # several .md files (or nested folders with .md files) loses nothing.
    for foldername in folders_to_remove:
        # A nested folder may already be gone with its parent.
        if os.path.isdir(foldername):
            shutil.rmtree(foldername)

def process_pdf_performance(path):
    """Run ``marker_single`` on every ``.pdf`` under *path* and flatten the output.

    The output directory ``<path>/extracted_pdf/`` is created if missing.
    Each ``.pdf`` file found while walking *path* is passed to the external
    ``marker_single`` command with ``--batch_multiplier 10``. Afterwards
    ``rename_and_move_files`` is applied to the output directory.

    NOTE(review): ``marker_single`` is presumably the PDF-to-Markdown CLI
    whose ``.md`` outputs ``rename_and_move_files`` collects -- confirm
    against the installed tool.

    Args:
        path: Root directory to search for PDF files.
    """
    path_extracted_pdf = path+"/extracted_pdf/"
    os.makedirs(path_extracted_pdf, exist_ok=True)
    for root, dirs, files in os.walk(path):
        for file in files:
            if not file.endswith('.pdf'):
                continue
            pdf_path = os.path.join(root, file)
            print("FILE IS ", pdf_path)
            # Pass arguments as a list (no shell) so spaces, quotes and other
            # shell metacharacters anywhere in the path are handled verbatim
            # instead of only escaping spaces in the file name.
            command = [
                "marker_single",
                pdf_path,
                path_extracted_pdf,
                "--batch_multiplier",
                "10",
            ]
            try:
                # check=False keeps the original best-effort behaviour:
                # a failing conversion does not abort the remaining files.
                subprocess.run(command, check=False)
            except OSError as exc:
                # e.g. marker_single is not installed / not executable.
                print(f"Could not run marker_single for {pdf_path}: {exc}")
    rename_and_move_files(path_extracted_pdf)