Browse Source

tried table extraction

beatescheibel 4 years ago
parent
commit
4b73861ebe

File diff suppressed because it is too large
+ 3912 - 10
iso_documents/ISO2768-1.html


iso_documents/ISO 2768-2.PDF → iso_documents/ISO2768-2.PDF


+ 0 - 67
output_mit_camelot-page-3-table-1.csv

@@ -1,67 +0,0 @@
-"Toleran
-zklasse
-Benennung
-Kurzzeichen","","Nennmaßb
-ereiche
-Grenzal
-bmaße für 1
-über 1000
-von 0,5^)
-über 120
-über 400
-über 3
-über 6
-über 30
-über 2000
-bis 6
-bis 2000
-bis 3
-bis 400
-bis 1000
-bis 4000
-bis 30
-bis 120
-CO
-o
-o","","","","","","",""
-"f
-fein","","CO
-±0,3
-±0,5
-±0,05
-±0,2
-—
-±0,05
-±0,1
-±0,15
-+1
-+1","","","","","","",""
-"m
-mittel","","±0,8
-±2
-±0,1
-±0,2
-±0,5
-±0,1
-±0,3
-± 1,2","","","","","","",""
-"c
-grob","","±3
-±1,2
-±2
-±4
-±0,2
-±0,3
-±0,5
-±0,8","","","","","","",""
-"V
-sehr grob","","±4
-±6
-±2,5
-±8
-—
-±0,5
-±1
-±1,5","","","","","","",""
-"^) Für Nennmaße unter 0,5 mm sind die Grenzabmaße direkt an dem (den) entsprechenden Nennmaß(en) anzugeben.","","","","","","","","",""

+ 0 - 18
output_mit_camelot-page-3-table-2.csv

@@ -1,18 +0,0 @@
-"Toleran
-zklasse
-Benennung
-Kurzzeichen","","iche
-Grei
-izabmaße für Nennmaßbere
-über 6
-von 0,5^) bis 3
-über 3 bis 6","",""
-"f
-fein","","±0,2","±0,5","± 1"
-"m
-mittel","","","",""
-"c
-grob","","±0,4","± 1","±2"
-"V
-sehr grob","","","",""
-"^) Für Nennmaße unter 0,5 mm sind die Grenzabmaße direkt an dem (den) entsprechenden Nennmaß(en) anzugeben.","","","",""

+ 0 - 32
output_mit_camelot-page-3-table-3.csv

@@ -1,32 +0,0 @@
-"Toleran
-zklasse
-Benennung
-Kurzzeichen","","ir Längenbereichi
-e, in mm, für den
-Grenzabmaße fC
->nden Winkels
-kürzeren Sch(
-3nkel des betreffe
-bis 10
-über 120
-über 400
-über 10
-über 50
-bis 50
-bis 400
-bis 120","","","",""
-"fein
-f","","± 1°
-± 0° 30'
-±0° 10'","","","","±0°5'"
-"m
-mittel","","","","","",""
-"c
-grob","","±0° 10'
-± 1°
-± 0° 30'
-±0° 15'","","","",""
-"V
-sehr grob","","±2°
-±1°
-±0° 20'","","","",""

+ 7 - 0
pdf_table_extractor.py

@@ -0,0 +1,7 @@
+import camelot  # script purpose: read tables from one PDF page with camelot, export them as CSV, then print and plot the first one
+import matplotlib.pyplot as plt  # only used for plt.show() at the end
+tables = camelot.read_pdf('/Users/beatescheibel/PycharmProjects/dxf_reader/iso_documents/ISO2768-1.PDF', pages="3",line_scale=70, line_tol=2, joint_tol=35)  # NOTE(review): absolute, machine-specific path; only page "3" is read; line_scale/line_tol/joint_tol look like hand-tuned detection settings - confirm against the camelot docs
+tables.export('foo.csv', f='csv')  # export in CSV format under the name 'foo.csv'; presumably one file per table (cf. the *-page-3-table-N.csv files removed in this commit) - confirm
+print(tables[0].df)  # print the first table's .df; assumes at least one table was detected - TODO confirm behaviour when none is found
+camelot.plot(tables[0], kind='grid')  # build a 'grid' plot for the first table
+plt.show()  # display the pending matplotlib figure(s)