File size: 633 Bytes
e730543 |
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 |
import torch
from transformers import AutoModelForObjectDetection, TableTransformerForObjectDetection
from PIL import Image, ImageDraw
import matplotlib.pyplot as plt
import matplotlib.patches as patches
from torchvision import transforms
import numpy as np
import pandas as pd
import easyocr
from tqdm.auto import tqdm
import cv2
import os
from pdf2image import convert_from_path
from pdf_processing import process_pdf
if __name__ == "__main__":
pdf_path = "./PDF2TEXT-UDP/input/financial_statements.pdf" # Path to your PDF
output_folder = "./PDF2TEXT-UDP/output" # Output folder
process_pdf(pdf_path, output_folder)
|