Extracting a Data Table from a PDF

I have done this in the past using Python with the tabula-py library:

from tabula import read_pdf
import pandas as pd
import os

# Extract every table found in a PDF and write each one to its own CSV file.
# Relies on `read_pdf` (tabula) and `os` imported at the top of the file.

# Path to your PDF file
pdf_path = 'INPUT'

# Define your static output folder
output_folder = 'OUTPUTFOLDER'

# Create the output folder if it doesn't exist. exist_ok=True makes this a
# single call and avoids the race between a separate existence check and
# the directory creation.
os.makedirs(output_folder, exist_ok=True)

# Use read_pdf with pages="all" to extract tables from all pages;
# multiple_tables=True asks for each detected table separately.
tables = read_pdf(pdf_path, pages="all", multiple_tables=True)

# Iterate over each table (DataFrame) and save it
for i, table in enumerate(tables):
    # Output files are numbered from 1: FILENAME_1.csv, FILENAME_2.csv, ...
    output_path = os.path.join(output_folder, f"FILENAME_{i+1}.csv")
    # index=False keeps the DataFrame's row index out of the CSV
    table.to_csv(output_path, index=False)