import gradio as gr import subprocess def nougat_ocr(file_name): # CLI Command to run cli_command = [ 'nougat', '--out', '/output', 'pdf', f'{file_name}', '--checkpoint', '/nougat' ] # Run the command and get .mmd file in an output folder subprocess.run(cli_command, stdout=subprocess.PIPE, stderr=subprocess.PIPE, text=True) return def predict(pdf_file): print(f"temporary file - {pdf_file.name}") pdf_name = pdf_file.name.split('/')[-1].split('.')[0] print(f"pdf file name - {pdf_name}") #! Get prediction for a PDF using nougat nougat_ocr(pdf_file.name) # Open the multimarkdown (.mmd) file for reading with open(f'/output/{pdf_name}.mmd', 'r') as file: content = file.read() return content with gr.Blocks() as demo: gr.HTML("