read_tables.py 372 B

123456789101112
  1. import tabula
  2. #tables = tabula.read_pdf("iso_documents/ISO1101.PDF", multiple_tables=True)
  3. #for table in tables:
  4. # print(table)
  5. #pdftotext - layout!!!!
  6. tabula.convert_into("iso_documents/ISO1101.PDF", "output.csv", output_format="csv", pages='all', multiple_tables=True)
  7. df = tabula.read_pdf("iso_documents/ISO1101.PDF", pages='all', multiple_tables=True)
  8. print(df)