pycrate/pycrate_asn1dir/3GPP_NR_F1AP_38473/extract.py

70 lines
1.9 KiB
Python

# -*- coding: UTF-8 -*-
# 1) convert all 36XYZ-$release.doc files to text files in utf-8 format with MS Office
# 2) use this script to extract all ASN.1 modules
import codecs
import re
dirpath = './'
path = dirpath + '38473-f80.txt'
# ASN.1 modules are described within specific sections
sections = [
'9.4.3 Elementary Procedure Definitions',
'9.4.4 PDU Definitions',
'9.4.5 Information Element Definitions',
'9.4.6 Common Definitions',
'9.4.7 Constant Definitions',
'9.4.8 Container Definitions'
]
module_def = re.compile('^([A-Z][a-zA-Z0-9\-]{0,})\s{0,}')
def main():
fd = codecs.open(path, 'r', 'utf-8')
speclines = fd.readlines()
fd.close()
#print(len(speclines))
inside, start = False, False
module = []
module_name = None
for line in speclines:
if line[:-1] in sections:
if inside:
raise(Exception('ASN.1 extraction failed: %s' % line))
inside, start = True, True
elif line[:-1] == 'END':
module.append(line)
inside = False
print('%s.asn' % module_name)
fd = codecs.open(dirpath + module_name + '.asn', 'w', 'utf-8')
fd.write( ''.join(module) )
fd.close()
module = []
module_name = None
else:
if inside:
#print('inside')
if start:
#print('start')
m = module_def.match(line)
if m:
module_name = m.group(1)
start = False
#print(module_name)
elif not re.match('^\s{0,}$', line) and line[:2] != '--':
start = False
# inside a module: storing the line
module.append(line)
print('> extraction done')
return 0
if __name__ == '__main__':
main()