2011-11-03 00:00:48 +01:00
|
|
|
'''
|
|
|
|
Utilities to analyze tomb output
|
|
|
|
'''
|
|
|
|
import re
|
|
|
|
|
2012-01-28 04:15:23 +01:00
|
|
|
#found: [m] followed by some ID (usually "found") inside square brackets, then
|
|
|
|
#something else, then a space, then the content
|
|
|
|
_found_regex = re.compile(r'^\[m\]\[([^]]+)\] +(([^:]+)://(.+))$')
|
|
|
|
#generic: programname, then some identifiers in square (or round) brackets,
|
|
|
|
#then maybe something else, then a space, then the context
|
|
|
|
_generic_regex = re.compile(r'^[a-z-]+ [[(]([^]]+)[\])] +(.+)$')
|
|
|
|
types = {'E':'error', 'W':'warning', 'D':'debug', '*':'success'}
|
2011-11-03 00:00:48 +01:00
|
|
|
def parse_line(line):
|
|
|
|
'''Analyze a single line.
|
|
|
|
Return None if no standard format is detected, a dict otherwise.
|
|
|
|
The fields 'type' and 'content' are always in the dict; 'content' may be
|
|
|
|
empty
|
|
|
|
'type' can be 'error', 'progress'
|
|
|
|
'''
|
|
|
|
|
2012-01-28 04:15:23 +01:00
|
|
|
|
|
|
|
match = _found_regex.match(line)
|
|
|
|
if match:
|
|
|
|
return { 'type': types.get(match.group(1)) or match.group(1),
|
|
|
|
'content': match.group(2), 'scheme': match.group(3),
|
|
|
|
'path': match.group(4) }
|
|
|
|
match = _generic_regex.search(line)
|
2011-11-03 00:00:48 +01:00
|
|
|
if match:
|
2012-01-28 04:15:23 +01:00
|
|
|
return { 'type': types.get(match.group(1)) or match.group(1),
|
|
|
|
'content': match.group(2) }
|
|
|
|
|
2011-11-03 00:00:48 +01:00
|
|
|
return None
|
|
|
|
|
|
|
|
|