nagrest/lib/nag_parse.py

98 lines
4.1 KiB
Python
Raw Normal View History

2022-03-25 18:07:23 +01:00
#!/usr/bin/env python3
import re
2022-03-29 11:46:21 +02:00
import json
import hashlib
2022-03-25 18:07:23 +01:00
from enum import Enum, auto
2022-03-30 11:53:56 +02:00
from .nag_object import NagObject, NagObjectType
2022-03-28 10:01:36 +02:00
2022-03-25 18:07:23 +01:00
class ParserState(Enum):
2022-03-28 20:10:32 +02:00
COMMENT = auto()
2022-03-25 18:07:23 +01:00
DEFINE = auto()
DIRECTIVE = auto()
MULTILINE = auto()
2022-03-29 11:46:21 +02:00
def hash_string(string:str) -> int:
hash = hashlib.sha256()
hash.update(string.encode('utf-8'))
digest = hash.hexdigest()
return int(digest,16) * 1000000
2022-03-25 18:07:23 +01:00
class NagParse:
2022-03-30 11:53:56 +02:00
def __init__(self):
2022-03-29 11:46:21 +02:00
self.m_config_table: dict[int,str] = dict()
2022-03-28 20:11:06 +02:00
self.m_objects: list[NagObject] = list()
2022-03-30 11:53:56 +02:00
2022-03-29 11:46:21 +02:00
2022-03-25 18:07:23 +01:00
def __str__(self):
string = str()
2022-03-28 20:11:06 +02:00
for object in self.m_objects:
string += str(object) + "\n"
2022-03-25 18:07:23 +01:00
return string
2022-03-30 11:53:56 +02:00
def consume_config_files(self, config_files: list[str]) -> None:
for config_file in config_files:
self.m_config_table[hash_string(config_file)] = config_file
for object in self.parse_config(config_file):
self.m_objects.append(object)
def consume_config_list(self, config_list: list[dict] ) -> None:
for object in config_list:
nag_object = NagObject()
nag_object.from_object(object)
self.m_objects.append(nag_object)
2022-03-29 11:47:04 +02:00
def to_json(self):
return json.dumps([x.to_object() for x in self.m_objects])
2022-03-25 18:07:23 +01:00
2022-03-28 10:01:36 +02:00
def parse_config(self,config_file: str) -> list[NagObject]:
2022-03-25 18:07:23 +01:00
state = ParserState.DEFINE
2022-03-28 10:01:36 +02:00
objects: list[NagObject] = list()
2022-03-25 18:07:23 +01:00
with open(config_file, 'r') as file_handle:
line_no = 0
2022-03-28 10:01:36 +02:00
cur_object = NagObject(config_file=config_file)
2022-03-25 18:07:23 +01:00
for rawline in file_handle.readlines():
2022-03-28 10:01:36 +02:00
# Clean up the config
2022-03-25 18:07:23 +01:00
line = re.sub(r'([a-z]){', r'\1 {',rawline.strip())
2022-03-28 10:01:36 +02:00
#line = re.sub(r'([a-zA-Z0-9])}', r'\1\n}',line.strip())
#line = re.sub(r'([a-zA-Z0-9]) }', r'\1\n}',line.strip())
2022-03-25 18:07:23 +01:00
line_no += 1
2022-03-28 10:01:36 +02:00
# This means it is a comment, we might want to save those later on
if len(line) == 0 or re.match('^[\t ]*[#]+', line):
2022-03-25 18:07:23 +01:00
continue
2022-03-28 10:01:36 +02:00
# This means we are done parsing and should reset for new object
2022-03-25 18:07:23 +01:00
if re.match(r'}', line):
objects.append(cur_object)
2022-03-28 10:01:36 +02:00
del cur_object
2022-03-25 18:07:23 +01:00
state = ParserState.DEFINE
continue
2022-03-28 10:01:36 +02:00
#if we get here it is not a comment and not the end of an object
2022-03-25 18:07:23 +01:00
fragments: list[str] = re.sub(' +', ' ', line.strip()).split()
2022-03-28 10:01:36 +02:00
# This is a new object and we should see what type it is, and what line number it is on
2022-03-25 18:07:23 +01:00
if state == ParserState.DEFINE:
if fragments[0] == 'define':
2022-03-28 10:01:36 +02:00
cur_object = NagObject(config_file=config_file, directives=list())
2022-03-25 18:07:23 +01:00
cur_object.m_line_no = line_no
2022-03-28 10:01:36 +02:00
cur_object.m_type = NagObjectType(fragments[1])
# For the next line we should be in DIRECTIVE state
2022-03-25 18:07:23 +01:00
state = ParserState.DIRECTIVE
else:
2022-03-28 10:01:36 +02:00
print("It's fucked up man")
break
# This is the DIRECTIVE state, where we want to collect key, values and find out if we should go to multiline mode
elif state == ParserState.DIRECTIVE:
if fragments[-1][-1] == '\\':
2022-03-25 18:07:23 +01:00
state = ParserState.MULTILINE
if re.match('^[a-z]+', fragments[0]):
cur_object.m_directives.append(
2022-03-28 10:01:36 +02:00
[fragments[0], " ".join(fragments[1:])])
# This is the MULTILINE state, directives can be on many lines if the '\n' is escaped with '\'
elif state == ParserState.MULTILINE:
cur_object.m_directives[-1][1] = cur_object.m_directives[-1][1].strip('\\') + ' ' + " ".join(fragments)
if fragments[-1][-1] != '\\':
state = ParserState.DIRECTIVE
else:
print("It's fucked up man")
break
2022-03-25 18:07:23 +01:00
return objects