# coding=utf8
"""Pull dimension-like text chunks and ISO references out of a drawing text dump.

The script reads one text file, splits it into short whitespace-delimited
chunks, collects every ISO reference found in those chunks, strips the parts
that are not wanted (ISO references, designations, words, lone digits, lone
letters) and prints what is left.
"""
import re

# Chunk pattern: a run of non-whitespace followed by a few optional
# whitespace-separated tokens, terminated by whitespace.
regex = r"(\S+\s{1,3}?\S*\s?\S*\S*\s?\S*\S*\s?\S*\S*\s?\S*\S*\s+)"  # extract all groups of numbers
# Capital letter, separator, 1-2 digits, separator, 1-2 digits, separator.
regex1 = r"([A-Z]\s?\W\s?\d\d?\s?\s?\W\s?\d\d?\s?\W)"  # used to strip the designations
regex2 = r"([a-zA-Z]{3,})"  # strip all words (three or more letters)
regex_isos = r"(ISO\s\d\d\d\d?\W?\d?\W?\d?\W?\d?)"  # get ISO standards
reg = r"(^\d{1}$)"  # strip chunks that consist of a single digit
reg1 = r"(^[A-Z]-?[A-Z]?$)"  # strip chunks that consist of one or two capital letters

extracted_dimensions = []

# The context manager closes the file even if reading fails.
with open('/home/bscheibel/PycharmProjects/dxf_reader/drawings/5129275_Rev01-GV12.txt', 'r') as file:
    text = file.read()

matches = re.findall(regex, text, re.MULTILINE)
extracted_dimensions.extend(chunk.strip() for chunk in matches)

isos = []
new_dims = []

# The next part removes everything that is not needed from each chunk.
for dim in extracted_dimensions:
    # Record every ISO reference in the chunk, not just the first one: the
    # substitution below removes all of them, so anything not recorded here
    # would be lost.
    isos.extend(re.findall(regex_isos, dim))

    # re.sub leaves the string untouched when the pattern does not match, so
    # no separate re.search guard is needed. The order matters: ISO references
    # must go before the generic word pattern eats the "ISO" prefix.
    for pattern in (regex_isos, regex1, regex2, reg, reg1):
        dim = re.sub(pattern, '', dim)

    # Skip chunks that ended up empty or whitespace-only after the removals.
    if dim.strip():
        new_dims.append(dim)

print(isos)
for dim in new_dims:
    print(dim)