'''
Utilities to analyze tomb output
'''
import re

#found: [m] followed by some ID (usually "found") inside square brackets, then
#something else, then a space, then the content
_found_regex = re.compile(r'^\[m\]\[([^]]+)\] +(([^:]+)://(.+))$')
#generic: programname, then some identifiers in square (or round) brackets,
#then maybe something else, then a space, then the context
_generic_regex = re.compile(r'^[a-z-]+ [[(]([^]]+)[\])] +(.+)$')
types = {'E': 'error', 'W': 'warning', 'D': 'debug', '*': 'success'}


def parse_line(line):
    '''Analyze a single line.
    Return None if no standard format is detected, a dict otherwise.
    The fields 'type' and 'content' are always in the dict; 'content' may be
    empty
    'type' can be 'error', 'progress'
    '''

    match = _found_regex.match(line)
    if match:
        return {'type': types.get(match.group(1)) or match.group(1),
                'content': match.group(2), 'scheme': match.group(3),
                'path': match.group(4)}
    match = _generic_regex.search(line)
    if match:
        return {'type': types.get(match.group(1)) or match.group(1),
                'content': match.group(2)}

    return None