# grepros/api/search_8py_source.html

# -*- coding: utf-8 -*-

"""

Search core.


------------------------------------------------------------------------------

This file is part of grepros - grep for ROS bag files and live topics.

Released under the BSD License.


@author      Erki Suurjaak

@created     28.09.2021

@modified    24.03.2024

------------------------------------------------------------------------------

"""

## @namespace grepros.search

from argparse import Namespace

import copy

import collections

import functools

import logging

import re


import six


from . import api

from . import common

from . import inputs


class Scanner(object):
    """
    ROS message grepper.

    In highlighted results, message field values that match search criteria are modified
    to wrap the matching parts in {@link grepros.common.MatchMarkers MatchMarkers} tags,
    with numeric field values converted to strings beforehand.
    """

    ## Namedtuple of (topic, message, timestamp, match, index in topic), as yielded from find()
    GrepMessage = collections.namedtuple("BagMessage", "topic message timestamp match index")

    ## Content patterns matching anything, as (field path or (), value re.Pattern);
    ## every entry needs to be a 2-tuple to be comparable with parsed content patterns
    ANY_MATCHES = [((), re.compile("(.*)", re.DOTALL)), ((), re.compile("(.?)", re.DOTALL))]

    ## Constructor argument defaults
    DEFAULT_ARGS = dict(PATTERN=(), CASE=False, FIXED_STRING=False, INVERT=False, EXPRESSION=False,
                        HIGHLIGHT=False, NTH_MATCH=1, BEFORE=0, AFTER=0, CONTEXT=0, MAX_COUNT=0,
                        MAX_PER_TOPIC=0, MAX_TOPICS=0, SELECT_FIELD=(), NOSELECT_FIELD=(),
                        MATCH_WRAPPER="**")


    def __init__(self, args=None, **kwargs):
        """
        Creates a scanner from search arguments.

        @param   args                     arguments as namespace or dictionary, case-insensitive
        @param   args.pattern             pattern(s) to find in message field values
        @param   args.fixed_string        pattern contains ordinary strings, not regular expressions
        @param   args.case                use case-sensitive matching in pattern
        @param   args.invert              select messages not matching pattern
        @param   args.expression          pattern(s) are a logical expression
                                          like 'this AND (this2 OR NOT "skip this")',
                                          with elements as patterns to find in message fields
        @param   args.highlight           highlight matched values
        @param   args.before              number of messages of leading context to emit before match
        @param   args.after               number of messages of trailing context to emit after match
        @param   args.context             number of messages of leading and trailing context to emit
                                          around match, overrides args.before and args.after
        @param   args.max_count           number of matched messages to emit (per file if bag input)
        @param   args.max_per_topic       number of matched messages to emit from each topic
        @param   args.max_topics          number of topics to emit matches from
        @param   args.nth_match           emit every Nth match in topic, starting from first
        @param   args.select_field        message fields to use in matching if not all
        @param   args.noselect_field      message fields to skip in matching
        @param   args.match_wrapper       string to wrap around matched values in find() and match(),
                                          both sides if one value, start and end if more than one,
                                          or no wrapping if zero values (default "**")
        @param   kwargs                   any and all arguments as keyword overrides, case-insensitive
        <!--sep-->

        Additional arguments when using match() or find(grepros.api.Bag):

        @param   args.topic               ROS topics to read if not all
        @param   args.type                ROS message types to read if not all
        @param   args.skip_topic          ROS topics to skip
        @param   args.skip_type           ROS message types to skip
        @param   args.start_time          earliest timestamp of messages to read
        @param   args.end_time            latest timestamp of messages to read
        @param   args.start_index         message index within topic to start from
        @param   args.end_index           message index within topic to stop at
        @param   args.unique              emit messages that are unique in topic
        @param   args.nth_message         read every Nth message in topic, starting from first
        @param   args.nth_interval        minimum time interval between messages in topic,
                                          as seconds or ROS duration
        @param   args.condition           Python expressions that must evaluate as true
                                          for message to be processable, see ConditionMixin
        @param   args.progress            whether to print progress bar
        @param   args.stop_on_error       stop execution on any error like unknown message type
        """
        # Parsed patterns, as
        # {key: [(() if any field else ('nested', 'path') or re.Pattern, re.Pattern), ]}
        self._patterns = {}
        # Expression parser-evaluator, and parsed expression tree if any,
        # as nested [op, val] like ["NOT", ["VAL", "skip this"]]
        self._expressor  = ExpressionTree()
        self._expression = None

        # Per-topic history, all keyed by (topic, typename, typehash):
        #   messages: {message ID: message}
        #   stamps:   {message ID: ROS time}
        #   counts:   {None: processed, True: matched, False: emitted as context}
        #   statuses: {message ID: True if matched else False if emitted else None}
        ordered_by_topic = lambda: collections.defaultdict(collections.OrderedDict)
        self._messages = ordered_by_topic()
        self._stamps   = ordered_by_topic()
        self._statuses = ordered_by_topic()
        self._counts   = collections.defaultdict(collections.Counter)

        # [re.Pattern to match against message fulltext for early skip of full matching]
        self._brute_prechecks = []
        # Running counter for unique message IDs
        self._idcounter = 0
        # Various cached settings
        self._settings = dict(
            highlight=None,       # Highlight matched values in message fields
            passthrough=False,    # Emit messages without pattern-matching and highlighting
            pure_anymatch=False,  # Simple match for any content
            wraps=[],             # Match wrapper start-end strings
        )

        self.source = None
        self.sink   = None
        self.valid  = None

        # Arguments as given, and arguments validated and complemented with defaults
        self.args0 = common.ensure_namespace(args, **kwargs)
        defaulted  = common.ensure_namespace(args, Scanner.DEFAULT_ARGS, **kwargs)
        self.args  = common.ArgumentUtil.validate(defaulted)
        if self.args.CONTEXT:  # Overrides both context directions
            self.args.BEFORE = self.args.AFTER = self.args.CONTEXT


    def find(self, source, highlight=None):
        """
        Yields matched and context messages from source.

        Yields nothing if scanner arguments fail validation.

        @param   source     inputs.Source or api.Bag instance
        @param   highlight  whether to highlight matched values in message fields,
                            defaults to flag from constructor
        @return             GrepMessage namedtuples of
                            (topic, message, timestamp, match, index in topic),
                            where match is matched optionally highlighted message
                            or `None` if yielding a context message
        """
        if self.validate(reset=True):
            if isinstance(source, api.Bag):  # Wrap plain bag into a message source
                source = inputs.BagSource(source, **vars(self.args))
            self._prepare(source, highlight=highlight, progress=True)
            for item in self._generate():
                yield self.GrepMessage(*item)


    def match(self, topic, msg, stamp, highlight=None):
        """
        Returns matched message if message matches search filters.

        Message is pushed through an inputs.AppSource, created on first use;
        every match is counted but only every NTH_MATCH-th match in topic is returned.

        @param   topic      topic name
        @param   msg        ROS message
        @param   stamp      message ROS timestamp
        @param   highlight  whether to highlight matched values in message fields,
                            defaults to flag from constructor
        @return             original or highlighted message on match else `None`
        """
        if not self.validate(reset=True):
            return None

        if isinstance(self.source, inputs.AppSource):
            self._configure_settings(highlight=highlight)
        else:
            self._prepare(inputs.AppSource(self.args), highlight=highlight)

        self.source.push(topic, msg, stamp)
        if self.source.read_queue() is None:
            return None

        self._idcounter += 1
        msgid = self._idcounter
        topickey = api.TypeMeta.make(msg, topic).topickey
        self._register_message(topickey, msgid, msg, stamp)
        matched = self._is_processable(topic, msg, stamp) and self.get_match(msg)
        self.source.notify(matched)

        result = None
        if matched:
            # Decide on emitting from match count before this match gets added
            is_nth = not self._counts[topickey][True] % (self.args.NTH_MATCH or 1)
            self._statuses[topickey][msgid] = True
            self._counts[topickey][True] += 1
            if is_nth:
                result = matched
        self._prune_data(topickey)
        self.source.mark_queue(topic, msg, stamp)
        return result


    def work(self, source, sink):
        """
        Greps messages yielded from source and emits matched content to sink.

        @param   source  inputs.Source or api.Bag instance
        @param   sink    outputs.Sink instance
        @return          count matched, or `None` if scanner arguments fail validation
        """
        if not self.validate(reset=True):
            return
        if isinstance(source, api.Bag):  # Wrap plain bag into a message source
            source = inputs.BagSource(source, **vars(self.args))
        self._prepare(source, sink, highlight=self.args.HIGHLIGHT, progress=True)

        total_matched = 0
        for topic, msg, stamp, matched, index in self._generate():
            sink.emit_meta()
            sink.emit(topic, msg, stamp, matched, index)
            if matched:  # Context messages come with a blank match
                total_matched += 1
        return total_matched


    def validate(self, reset=False):

        """Returns whether conditions have valid syntax, prints errors."""

        if self.valid is not None and not reset: return self.valid


        errors = collections.defaultdict(list)  # {category: [error, ]}

        if not self.args.FIXED_STRING and not self.args.EXPRESSION:

            for v in self.args.PATTERN:  # Pre-check patterns before parsing for full error state

                split = v.find("=", 1, -1)  # May be "PATTERN" or "attribute=PATTERN"

                v = v[split + 1:] if split > 0 else v

                try: re.compile(re.escape(v) if self.args.FIXED_STRING else v)

                except Exception as e:

                    errors["Invalid regular expression"].append("'%s': %s" % (v, e))

        try: self._parse_patterns()

        except Exception as e: errors[""].append(str(e))


        for err in errors.get("", []):

            common.ConsolePrinter.log(logging.ERROR, err)

        for category in filter(bool, errors):

            common.ConsolePrinter.log(logging.ERROR, category)

            for err in errors[category]:

                common.ConsolePrinter.log(logging.ERROR, "  %s" % err)


        self.valid = not errors

        return self.valid


    def __enter__(self):
        """Context manager entry, does nothing, returns self for use as `with` target."""
        return self


    def __exit__(self, exc_type, exc_value, traceback):

        """Context manager exit, does nothing."""

        return self


    def _generate(self):
        """
        Yields matched and context messages from source.

        Reads messages from `self.source`, registers each in local per-topic history,
        and yields every NTH_MATCH-th match in topic, preceded by any not yet emitted
        before-context. Non-matching messages following a recent match are yielded
        as after-context. Local history is cleared when source batch changes,
        and source batch is closed once maximum match counts have been reached.

        @return  tuples of (topic, msg, stamp, matched optionally highlighted msg, index in topic)
        """
        batch_matched, batch = False, None
        for topic, msg, stamp in self.source.read():
            if batch != self.source.get_batch():  # Batch changed: start over with blank state
                batch, batch_matched = self.source.get_batch(), False
                if self._counts: self._clear_data()

            msgid = self._idcounter = self._idcounter + 1
            topickey = api.TypeMeta.make(msg, topic).topickey
            self._register_message(topickey, msgid, msg, stamp)
            # Falsy if message skipped or not matching, else original or highlighted message
            matched = self._is_processable(topic, msg, stamp) and self.get_match(msg)

            self.source.notify(matched)
            # Emit if count of earlier matches in topic is a multiple of NTH_MATCH
            if matched and not self._counts[topickey][True] % (self.args.NTH_MATCH or 1):
                self._statuses[topickey][msgid] = True
                self._counts[topickey][True] += 1
                for x in self._generate_context(topickey, before=True): yield x
                yield (topic, msg, stamp, matched, self._counts[topickey][None])
            elif matched:  # Not NTH_MATCH, skip emitting
                self._statuses[topickey][msgid] = True
                self._counts[topickey][True] += 1
            elif self.args.AFTER \
            and self._has_in_window(topickey, self.args.AFTER + 1, status=True):
                # Not a match, but there is a match among the preceding AFTER messages
                for x in self._generate_context(topickey, before=False): yield x
            batch_matched = batch_matched or bool(matched)

            self._prune_data(topickey)
            if batch_matched and self._is_max_done():  # Nothing more to emit from this batch
                if self.sink: self.sink.flush()
                self.source.close_batch()


    def _is_processable(self, topic, msg, stamp):
        """
        Returns whether message should be processed further.

        False if total match count, match count in topic, or count of matched topics
        has reached its configured maximum, or if source rejects the message
        at its current index in topic.
        """
        limits = self.args
        topickey = api.TypeMeta.make(msg, topic).topickey

        if limits.MAX_COUNT:
            total = sum(counter[True] for counter in self._counts.values())
            if total >= limits.MAX_COUNT:
                return False

        if limits.MAX_PER_TOPIC:
            if self._counts[topickey][True] >= limits.MAX_PER_TOPIC:
                return False

        if limits.MAX_TOPICS:
            # Only topics already having matches are acceptable once limit is full
            matched_keys = [key for key, counter in self._counts.items() if counter[True]]
            if len(matched_keys) >= limits.MAX_TOPICS and topickey not in matched_keys:
                return False

        if self.source:
            index = self._counts[topickey][None]
            if not self.source.is_processable(topic, msg, stamp, index):
                return False
        return True


    def _generate_context(self, topickey, before=False):

        """Yields before/after context for latest match."""

        count = self.args.BEFORE + 1 if before else self.args.AFTER

        candidates = list(self._statuses[topickey])[-count:]

        current_index = self._counts[topickey][None]

        for i, msgid in enumerate(candidates) if count else ():

            if self._statuses[topickey][msgid] is None:

                idx = current_index + i - (len(candidates) - 1 if before else 1)

                msg, stamp = self._messages[topickey][msgid], self._stamps[topickey][msgid]

                self._counts[topickey][False] += 1

                yield topickey[0], msg, stamp, None, idx

                self._statuses[topickey][msgid] = False


    def _clear_data(self):
        """Empties per-topic counts and message history, and clears api.TypeMeta."""
        self._counts.clear()
        self._messages.clear()
        self._stamps.clear()
        self._statuses.clear()
        api.TypeMeta.clear()


    def _prepare(self, source, sink=None, highlight=None, progress=False):
        """
        Resets local state, attaches source and sink to scanner and each other, caches settings.

        @param   source     message source to read from
        @param   sink       message sink to emit to, if any
        @param   highlight  highlight flag passed on to settings configuration
        @param   progress   progress flag passed on to settings configuration
        """
        self._clear_data()
        self.source = source
        self.sink = sink
        source.bind(sink)
        if sink:
            sink.bind(source)
        source.preprocess = False
        self._configure_settings(highlight=highlight, progress=progress)


    def _prune_data(self, topickey):

        """Drops history older than context window."""

        WINDOW = max(self.args.BEFORE, self.args.AFTER) + 1

        for dct in (self._messages, self._stamps, self._statuses):

            while len(dct[topickey]) > WINDOW:

                msgid = next(iter(dct[topickey]))

                value = dct[topickey].pop(msgid)

                dct is self._messages and api.TypeMeta.discard(value)


    def _parse_patterns(self):

        """Parses pattern arguments into re.Patterns. Raises on invalid pattern."""

        NOBRUTE_SIGILS = r"\A", r"\Z", "?("  # Regex specials ruling out brute precheck

        BRUTE, FLAGS = not self.args.INVERT, re.DOTALL | (0 if self.args.CASE else re.I)

        self._patterns.clear()

        self._expression = None

        del self._brute_prechecks[:]

        contents = []


        def make_pattern(v):

            """Returns (path Pattern or (), value Pattern)."""

            split = v.find("=", 1, -1)

            v, path = (v[split + 1:], v[:split]) if split > 0 else (v, ())

            # Special case if '' or "": add pattern for matching empty string

            v = "|^$" if v in ("''", '""') else (re.escape(v) if self.args.FIXED_STRING else v)

            path = re.compile(r"(^|\.)%s($|\.)" % ".*".join(map(re.escape, path.split("*")))) \

                   if path else ()

            try: return (path, re.compile("(%s)" % v, FLAGS))

            except Exception as e:

                raise ValueError("Invalid regular expression\n  '%s': %s" % (v, e))


        if self.args.EXPRESSION and self.args.PATTERN:

            self._expression = self._expressor.parse(" ".join(self.args.PATTERN), make_pattern)

        for v in self.args.PATTERN if not self._expression else ():

            contents.append(make_pattern(v))

            if BRUTE and (self.args.FIXED_STRING or not any(x in v for x in NOBRUTE_SIGILS)):

                if self.args.FIXED_STRING: v = re.escape(v)

                self._brute_prechecks.append(re.compile(v, re.I | re.M))

        if not self.args.PATTERN:  # Add match-all pattern

            contents.append(self.ANY_MATCHES[0])

        self._patterns["content"] = contents


        selects, noselects = self.args.SELECT_FIELD, self.args.NOSELECT_FIELD

        for key, vals in [("select", selects), ("noselect", noselects)]:

            self._patterns[key] = [(tuple(v.split(".")), common.path_to_regex(v)) for v in vals]


    def _register_message(self, topickey, msgid, msg, stamp):

        """Registers message with local structures."""

        self._counts[topickey][None] += 1

        self._messages[topickey][msgid] = msg

        self._stamps  [topickey][msgid] = stamp

        self._statuses[topickey][msgid] = None


    def _configure_settings(self, highlight=None, progress=False):
        """
        Caches settings for message matching; configures expression evaluator, source and sink.

        @param   highlight  whether to highlight matched values in message fields;
                            if None, uses args.HIGHLIGHT, unless there is a sink
                            reporting that it is not highlighting
        @param   progress   whether to configure source progress reporting;
                            skipped if there is no matching to do and no MAX_COUNT
        """
        highlight = bool(highlight if highlight is not None else self.args.HIGHLIGHT
                         if not self.sink or self.sink.is_highlighting() else False)
        # Whether content patterns consist of nothing but match-anything patterns
        pure_anymatch = not self.args.INVERT and not self._patterns["select"] \
                        and set(self._patterns["content"]) <= set(self.ANY_MATCHES)
        no_matching = pure_anymatch and not self._expression and not self._patterns["noselect"]
        passthrough = no_matching and not highlight  # No message processing at all
        # Wrapper strings: none if not highlighting, MATCH_WRAPPER argument if no sink,
        # else start and end markers from common.MatchMarkers
        wraps = [] if not highlight else self.args.MATCH_WRAPPER if not self.sink else \
                (common.MatchMarkers.START, common.MatchMarkers.END)
        wraps = wraps if isinstance(wraps, (list, tuple)) else [] if wraps is None else [wraps]
        # Normalize to exactly two items: single value is used on both sides, no value gives ["", ""]
        wraps = ((wraps or [""]) * 2)[:2]
        # NOTE(review): `wraps` has two items at this point, so it is truthy even if both
        # are blank, and the else-branch below appears unreachable — confirm intent
        if wraps:  # Track pattern contribution to wrapping
            ops = {ExpressionTree.AND: BooleanResult.and_, ExpressionTree.NOT: BooleanResult.not_,
                   ExpressionTree.OR: functools.partial(BooleanResult.or_, eager=True)}
            self._expressor.configure(operators=ops, void=BooleanResult(None))
        else: self._expressor.configure(operators=ExpressionTree.OPERATORS,
                                        void=ExpressionTree.VOID)  # Ensure defaults
        self._settings.update(highlight=highlight, passthrough=passthrough,
                              pure_anymatch=pure_anymatch, wraps=wraps)
        # Source and sink get the arguments as originally given, without scanner defaults
        self.source.configure(self.args0)
        self.sink and self.sink.configure(self.args0)
        if progress and (not no_matching or self.args.MAX_COUNT):
            bar_opts = dict()
            if self.args.MAX_COUNT: bar_opts.update(match_max=self.args.MAX_COUNT)
            if not no_matching: bar_opts.update(source_value=0)  # Count source and match separately
            self.source.configure_progress(**bar_opts)


    def _is_max_done(self):

        """Returns whether max match count has been reached (and message after-context emitted)."""

        result, is_maxed = False, False

        if self.args.MAX_COUNT:

            is_maxed = sum(vv[True] for vv in self._counts.values()) >= self.args.MAX_COUNT

        if not is_maxed and self.args.MAX_PER_TOPIC:

            count_required = self.args.MAX_TOPICS or len(self.source.topics)

            count_maxed = sum(vv[True] >= self.args.MAX_PER_TOPIC

                              or vv[None] >= (self.source.topics.get(k) or 0)

                              for k, vv in self._counts.items())

            is_maxed = (count_maxed >= count_required)

        if is_maxed:

            result = not self.args.AFTER or \

                     not any(self._has_in_window(k, self.args.AFTER, status=True, full=True)

                             for k in self._counts)

        return result


    def _has_in_window(self, topickey, length, status, full=False):

        """Returns whether given status exists in recent message window."""

        if not length or full and len(self._statuses[topickey]) < length:

            return False

        return status in list(self._statuses[topickey].values())[-length:]


    def get_match(self, msg):
        """
        Returns transformed message if all patterns find a match in message, else None.

        Matching field values are converted to strings and surrounded by markers.
        Returns original message if any-match and sink does not require highlighting.

        If patterns are a logical expression, message matches if the expression
        evaluates as true over its patterns. Matching is inverted if args.INVERT.

        @param   msg  ROS message
        @return       original message or its highlighted deep copy if match, else None
        """

        def process_value(v, parent, top, patterns):
            """
            Populates `field_matches` and `pattern_spans` for patterns matching given string value.
            Populates `field_values`. Returns set of pattern indexes that found a match.

            @param   v         field value
            @param   parent    object containing the value, message or list
            @param   top       field path as tuple of names and list indexes
            @param   patterns  list of (path Pattern or (), value Pattern)
            """
            indexes, spans, topstr = set(), [], ".".join(map(str, top))
            v2 = str(list(v) if isinstance(v, LISTIFIABLES) else v)
            if v and isinstance(v, (list, tuple)): v2 = v2[1:-1]  # Omit collection braces, leave []
            for i, (path, p) in enumerate(patterns):
                if path and not path.search(topstr): continue  # for
                # First match suffices if plain invert, as any match rules the message out
                matches = [next(p.finditer(v2), None)] if PLAIN_INVERT else list(p.finditer(v2))
                # Join consecutive zero-length matches, extend remaining zero-lengths to end of value
                matchspans = common.merge_spans([x.span() for x in matches if x], join_blanks=True)
                matchspans = [(a, b if a != b else len(v2)) for a, b in matchspans]
                if matchspans:
                    indexes.add(i), spans.extend(matchspans)
                    pattern_spans.setdefault(id(patterns[i]), {})[top] = matchspans
            field_values.setdefault(top, (parent, v, v2))
            # If plain invert: mark entire non-blank value if nothing matched in it
            if PLAIN_INVERT: spans = [(0, len(v2))] if v2 and not spans else []
            if spans: field_matches.setdefault(top, []).extend(spans)
            return indexes

        def populate_matches(obj, patterns, top=(), parent=None):
            """
            Recursively populates `field_matches`  and `pattern_spans` for fields matching patterns.
            Populates `field_values`. Returns set of pattern indexes that found a match.

            @param   obj       ROS message, or a value in a message list field
            @param   patterns  list of (path Pattern or (), value Pattern)
            @param   top       path of obj as tuple of names and list indexes
            @param   parent    object containing obj, if any
            """
            indexes = set()
            selects, noselects = self._patterns["select"], self._patterns["noselect"]
            fieldmap = api.get_message_fields(obj)  # Returns obj if not ROS message
            if fieldmap != obj:
                fieldmap = api.filter_fields(fieldmap, top, include=selects, exclude=noselects)
            for k, t in fieldmap.items() if fieldmap != obj else ():
                v, path = api.get_message_value(obj, k, t), top + (k, )
                if api.is_ros_message(v):  # Nested message
                    indexes |= populate_matches(v, patterns, path, obj)
                elif v and isinstance(v, (list, tuple)) \
                and api.scalar(t) not in api.ROS_NUMERIC_TYPES:
                    for i, x in enumerate(v):  # List of strings or nested messages
                        indexes |= populate_matches(x, patterns, path + (i, ), v)
                else:  # Scalar value, empty list, or list of numbers
                    indexes |= process_value(v, obj, path, patterns)
            if not api.is_ros_message(obj):  # Plain value from a list field
                indexes |= process_value(obj, parent, top, patterns)
            return indexes

        def wrap_matches(values, matches):
            """
            Replaces result-message field values with matched parts wrapped in marker tags.

            @param   values   {field path: (parent, original value, stringified value)}
            @param   matches  {field path: [(span), ]}
            """
            for path, spans in matches.items() if any(WRAPS) else ():
                parent, v1, v2 = values[path]
                for a, b in reversed(common.merge_spans(spans)):  # Backwards for stable indexes
                    v2 = v2[:a] + WRAPS[0] + v2[a:b] + WRAPS[1] + v2[b:]
                if v1 and isinstance(v1, (list, tuple)): v2 = "[%s]" % v2  # Readd collection braces
                if isinstance(parent, list) and isinstance(path[-1], int): parent[path[-1]] = v2
                else: api.set_message_value(parent, path[-1], v2)

        def process_message(obj, patterns):
            """Returns whether message matches patterns, wraps matches in marker tags if so."""
            indexes = populate_matches(obj, patterns)
            # Match if no pattern found anything when inverting, else if every pattern found something
            is_match = not indexes if self.args.INVERT else len(indexes) == len(patterns)
            if not indexes and self._settings["pure_anymatch"] and not api.get_message_fields(obj):
                is_match = True  # Ensure any-match for messages with no fields
            if is_match and WRAPS: wrap_matches(field_values, field_matches)
            return is_match

        if self._settings["passthrough"]: return msg

        if self._brute_prechecks:
            # Every precheck pattern needs to occur somewhere in the combined text of field values
            text  = "\n".join("%r" % (v, ) for _, v, _ in api.iter_message_fields(msg, flat=True))
            if not all(any(p.finditer(text)) for p in self._brute_prechecks):
                return None  # Skip detailed matching if patterns not present at all

        WRAPS         = self._settings["wraps"]
        LISTIFIABLES  = (bytes, tuple) if six.PY3 else (tuple, )
        PLAIN_INVERT  = self.args.INVERT and not self._expression
        field_values  = {}  # {field path: (parent, original value, stringified value)}
        field_matches = {}  # {field path: [(span), ]}
        pattern_spans = {}  # {id(pattern tuple): {field path: (span)}}

        # Work on a copy if wrapping, to leave the original message unmodified
        result, is_match = copy.deepcopy(msg) if WRAPS else msg, False
        if self._expression:
            # Each expression operand is matched as a single pattern against the whole message
            evaler = lambda x: bool(populate_matches(result, [x]))
            terminal = evaler if not WRAPS else lambda x: BooleanResult(x, evaler)
            eager = [ExpressionTree.OR] if WRAPS else ()
            evalresult = self._expressor.evaluate(self._expression, terminal, eager)
            is_match = not evalresult if self.args.INVERT else evalresult
            if is_match and WRAPS:
                # Wrap spans of patterns given in evaluation result, or all values if no spans
                actives = [pattern_spans[id(v)] for v in evalresult]
                matches = {k: sum((v.get(k, []) for v in actives), [])
                           for k in set(sum((list(v) for v in actives), []))} or \
                          {k: [(0, len(v))] for k, (_, _, v) in field_values.items()}  # Wrap all
                wrap_matches(field_values, matches)
        else:
            is_match = process_message(result, self._patterns["content"])
        return result if is_match else None


class ExpressionTree(object):
    r"""
    Parses and evaluates operator expressions like "a AND (b OR NOT c)".

    Operands can be quoted strings, '\' can be used to escape quotes within the string.
    Operators are case-insensitive by default (see `CASED`).

    Trees are nested two-item lists of `[operator or VAL, value]`, where the value of
    an operator node is a list of child nodes, and the value of a VAL node is the operand.
    All upper-case class properties can be overridden per instance via constructor keywords
    or configure().
    """

    QUOTES, ESCAPE, LBRACE, RBRACE, WHITESPACE = "'\"", "\\", "(", ")", " \n\r\t"
    SEPARATORS = WHITESPACE + LBRACE + RBRACE
    AND, OR, NOT, VAL = "AND", "OR", "NOT", "VAL"

    CASED     = False      # Whether operators are case-sensitive
    IMPLICIT  = AND        # Implicit operator inserted between operands lacking one
    UNARIES   = (NOT, )    # Unary operators, expecting operand after operator
    BINARIES  = (AND, OR)  # Binary operators, expecting operands before and after operator
    OPERATORS = {AND: (lambda a, b: a and b), OR: (lambda a, b: a or b), NOT: lambda a: not a}
    RANKS     = {VAL: 1, NOT: 2, AND: 3, OR: 4}

    SHORTCIRCUITS    = {AND: False, OR: True}  # Values for binary operators to short-circuit on
    FORMAT_TEMPLATES = {AND: "%s and %s", OR: "%s or %s", NOT: "not %s"}
    VOID = None  # Placeholder for operands skipped as short-circuited


    def __init__(self, **props):
        """
        @param   props  class property overrides, case-insensitive, e.g. `cased=False`
        """
        self._state = None  # Temporary state namespace dictionary during parse
        self.configure(**props)


    def configure(self, **props):
        """
        Overrides instance configuration.

        Values are type-checked against the class-level default of the property, so that
        a property can be re-configured after having been set to None (e.g. `implicit`).
        Lists and tuples are accepted interchangeably; `void` accepts any value;
        `implicit` additionally accepts None. Raises ValueError on type mismatch,
        AttributeError on unknown property.

        @param   props  class property overrides, case-insensitive, e.g. `cased=False`
        """
        for k, v in props.items():
            K = k.upper()
            # Look up on instance first, to raise AttributeError for unknown properties;
            # prefer class-level default as type reference, as instance value may be None
            V = getattr(type(self), K, getattr(self, K))
            accept = (type(V), type(None)) if "IMPLICIT" == K else () if "VOID" == K else type(V)
            if accept and not isinstance(v, accept) and set(map(type, (v, V))) - set([list, tuple]):
                raise ValueError("Invalid value for %s=%s: expected %s" % (k, v, type(V).__name__))
            setattr(self, K, v)


    def evaluate(self, tree, terminal=None, eager=()):
        """
        Returns result of evaluating expression tree, None if tree is empty.

        Evaluation is iterative, using an explicit stack instead of recursion.
        Second operand of a binary operator is not evaluated if first operand
        short-circuits the operator, operator is given `VOID` as second operand instead.

        @param   tree      expression tree structure as given by parse()
        @param   terminal  callback(value) to evaluate value nodes with, if not using value directly
        @param   eager     operators where to evaluate both operands in full, despite short-circuit
        """
        stack = [(tree, [], [], None)] if tree else []
        while stack:  # [(node, evaled vals, parent evaled vals, parent op)]
            (op, val), nvals, pvals, parentop = stack.pop()
            if nvals:  # Backtracking: all children evaluated, fill parent with operator result
                pvals.append(self.OPERATORS[op](*nvals))
                continue  # while
            if pvals and parentop in self.SHORTCIRCUITS and not (eager and parentop in eager):
                ctor = type(self.SHORTCIRCUITS[parentop])  # Skip if first sibling short-circuits op
                if ctor(pvals[0]) == self.SHORTCIRCUITS[parentop]:
                    pvals.append(self.VOID)
                    continue  # while
            if op not in self.OPERATORS: pvals.append(val if terminal is None else terminal(val))
            else: stack.extend([((op, val), nvals, pvals, parentop)] +
                               [(v, [], nvals, op) for v in val[::-1]])  # Queue in processing order
        return pvals.pop() if tree else None


    def format(self, tree, terminal=None):
        """
        Returns expression tree formatted as string, "" if tree is empty.

        Child expressions are wrapped in brackets if their operator ranks higher in `RANKS`
        than the parent operator. Operators lacking an entry in `FORMAT_TEMPLATES`
        are formatted with operator name as is.

        @param   tree      expression tree structure as given by parse()
        @param   terminal  callback(value) to format value nodes with, if not using value directly
        """
        # Template for bracketed child, like "(%s)"
        BRACED = "%s".join(self.FORMAT_TEMPLATES.get(x, x) for x in [self.LBRACE, self.RBRACE])
        # Fallback operator template, like "%s XOR %s" for binary or "XOR %s" for unary
        TPL = lambda op: ("%s {0} %s" if op in self.BINARIES else "{0} %s").format(op)
        # Template for child of given operator under given parent operator
        WRP = lambda op, parentop: BRACED if self.RANKS[op] > self.RANKS[parentop] else "%s"
        # Tuple of formatted children, bracketed as needed
        FMT = lambda vv, op, nodes: tuple(WRP(nop, op) % v for (nop, _), v in zip(nodes, vv))
        stack = [(tree, [], [])] if tree else [] # [(node, formatted vals, parent formatted vals)]
        while stack:  # Add to parent if all processed or terminal node, else queue for processing
            (op, val), nvals, pvals = stack.pop()
            if nvals: pvals.append((self.FORMAT_TEMPLATES.get(op) or TPL(op)) % FMT(nvals, op, val))
            elif op not in self.OPERATORS: pvals.append(val if terminal is None else terminal(val))
            else: stack.extend([((op, val), nvals, pvals)] + [(v, [], nvals) for v in val[::-1]])
        return pvals.pop() if tree else ""


    def parse(self, text, terminal=None):
        """
        Returns an operator expression like "a AND (b OR NOT c)" parsed into a binary tree.

        Binary tree like ["AND", [["VAL", "a"], ["OR", [["VAL", "b"], ["NOT", [["VAL", "c"]]]]]]].
        Returns an empty list for blank text.
        Raises ValueError on invalid expression.

        @param   text      expression text to parse
        @param   terminal  callback(text) returning node value for operands, if not using plain text
        """
        root, node, buf, quote, escape, i = [], [], "", "", "", -1
        # Local variables are shared with helper functions as state dictionary;
        # helpers read and update current node and root from there
        self._state = locals()
        h = self._make_helpers(self._state, text, terminal)

        for i, char in enumerate(text + " "):  # Append space to simplify termination
            # First pass: handle quotes, or explicit/implicit word ends and operators
            if quote:
                if escape:
                    if   char == self.ESCAPE: char = ""  # Double escape: retain single
                    elif char in self.QUOTES: buf = buf[:-1]  # Drop escape char from before quote
                elif char == quote:  # End quote
                    (node, root), buf, quote, char = h.add_node(self.VAL, buf, i), "", "", ""
                escape = char if self.ESCAPE == char else ""
            elif char in self.QUOTES:
                h.validate(i, "quotes", buf=buf)  # Quote may not start in the middle of a word
                if node and h.finished(node): node, root = h.add_implicit(node, i)
                quote, char = char, ""  # Start quoted string, consume quotemark
            elif char in self.SEPARATORS:
                op = h.parse_op(buf)
                if op:  # Explicit operator
                    h.validate(i, "op", op=op)
                    if op in self.UNARIES and node and h.finished(node):
                        node, root = h.add_implicit(node, i)
                    val = h.make_val(op, None if op in self.UNARIES else node)
                    node, root = h.add_node(op, val, i)
                else:  # Consume accumulated buffer if any, handle implicit operators
                    if (buf or char == self.LBRACE) and node and h.finished(node):
                        node, root = h.add_implicit(node, i)
                    if buf: node, root = h.add_node(self.VAL, buf, i)  # Completed operand
                buf = ""
            # Second pass: accumulate text buffer, or enter/exit bracket groups
            if quote or char not in self.SEPARATORS: buf += char
            elif char == self.LBRACE: _, (node, root) = h.stack_push((node, root, i)), ([], [])
            elif char == self.RBRACE: _, (node, root) = h.validate(i, "rbrace"), h.stack_pop()
            self._state.update(locals())  # Sync changed locals to state shared with helpers
        h.validate(i)
        return root


    def _make_helpers(self, state, text, terminal=None):
        """
        Returns namespace object with parsing helper functions.

        @param   state     parse state dictionary, read and updated by helpers
                           (keys "node", "root", "nodei", "stacki", "quote")
        @param   text      expression text being parsed, used in error messages
        @param   terminal  callback(text) returning node value for operands, if not using plain text
        """
        ERRLABEL, OP_MAXLEN = "Invalid expression: ", max(map(len, self.OPERATORS))
        OPERATORS = {x if self.CASED else x.upper(): x for x in self.OPERATORS}
        stack, parents = [], {}  # [(node, root, text index) at bracket start], {id(node): parent}

        # whether node has all operands: last slot of operand list is not a None placeholder
        finished  = lambda n:     not (isinstance(n[1], list) and n[1] and n[1][-1] is None)
        outranks  = lambda a, b:  self.RANKS[a] > self.RANKS[b]    # whether operator a ranks over b
        postbrace = lambda:       state.get("stacki") is not None  # whether brackets just ended
        mark      = lambda i:     "\n%s\n%s^" % (text, " " * i)    # expression text marked at pos
        oper      = lambda n:     n[0]                             # node type
        # operator for text buffer, or None if buffer not an operator
        parse_op  = lambda b:     OPERATORS.get(b if self.CASED else b.upper()) \
                                  if len(b) <= OP_MAXLEN else None
        # new [type, value] node, with terminal callback applied to operand values
        make_node = lambda o, v:  [o, terminal(v) if terminal and self.VAL == o else v]
        # operand list padded with None placeholders, to two slots for binaries else to one
        make_val  = lambda o, *a: list(a) + [None] * (1 + (o in self.BINARIES) - len(a))
        # sets b as last operand of a, registers a as parent of b
        add_child = lambda a, b:  (a[1].__setitem__(-1, b), parents.update({id(b): a}))
        # operand of node at index, or None if node not an operator
        get_child = lambda n, i:  n[1][i] if n[0] in self.OPERATORS else None

        def missing(op, first=False):  # Return error text for missing operand in operator
            label = ("1st " if first else "2nd ") if op in self.BINARIES else ""
            return ERRLABEL + "missing %selement for %s-operator" % (label, op)

        def add_node(op, val, i):  # Add new node to tree, return (node to use as last, root)
            node0, root0 = _, newroot = state["node"], state["root"]
            if op in self.BINARIES:  # Attach last child or root to new if needed
                if not postbrace() and finished(node0) and not outranks(op, oper(node0)):
                    val = make_val(op, get_child(node0, -1), None)  # Last child into new
                elif not outranks(oper(root0), op):
                    val = make_val(op, root0, None)  # Root into new
            newnode = make_node(op, val)

            if node0 and not postbrace() and (not finished(node0)  # Last is unfinished
            or oper(node0) in self.BINARIES and not outranks(op, oper(node0))):  # op <= last binop
                add_child(node0, newnode)  # Attach new node to last
            elif not root0 or (root0 is node0 if postbrace() else not outranks(oper(root0), op)):
                newroot = newnode  # Replace root if new outranks, or expression so far was braced
            latest = node0 if node0 and op == self.VAL else newnode
            while oper(latest) in self.UNARIES and finished(latest) and id(latest) in parents:
                latest = parents[id(latest)]  # Walk up filled unary nodes until binop/root
            state.update(node=latest, root=newroot, nodei=i, stacki=None)
            return latest, newroot

        def add_implicit(node, i):  # Add implicit operator, return (node to use as last, root)
            if not self.IMPLICIT: raise ValueError(ERRLABEL + "missing operator" + mark(i))
            return add_node(self.IMPLICIT, make_val(self.IMPLICIT, node), i)

        def stack_pop():  # Unstack previous and add current, return (node to use as last, root)
            (node, root, stacki), nodex, rootx = stack.pop(), state["node"], state["root"]
            if node: node, stacki, _ = root, None, add_child(node, rootx)  # Nest into last
            elif not root: node, root = nodex, rootx  # Replace empty root with nested
            state.update(node=node, root=root, stacki=stacki)
            return node, root

        def validate(i, ctx=None, **kws):  # Raise ValueError if parse state invalid
            if "quotes" == ctx:  # Starting a quote: no unquoted text may directly precede
                if kws["buf"]: raise ValueError(ERRLABEL + "invalid syntax" + mark(i))
            elif "op" == ctx:  # Adding operator: binary needs a completed preceding operand
                op, node = kws["op"], state["node"]
                if op in self.BINARIES and (not node or not finished(node)):
                    raise ValueError(missing(oper(node) if node else op, first=not node) + mark(i))
            elif "rbrace" == ctx:  # Ending bracket: needs a started bracket with complete content
                node, nodei = (state.get(k) for k in ("node", "nodei"))
                if not stack: raise ValueError(ERRLABEL + "bracket end has no start" + mark(i))
                if not node: raise ValueError(ERRLABEL + "empty bracket" + mark(i))
                if not finished(node): raise ValueError(missing(oper(node)) + mark(nodei))
            else:  # All parsing done, tree in final state
                quote, node, nodei = (state.get(k) for k in ("quote", "node", "nodei"))
                if quote: raise ValueError(ERRLABEL + "unfinished quote" + mark(i - 1))
                if stack: raise ValueError(ERRLABEL + "unterminated bracket" + mark(stack[-1][-1]))
                if node and not finished(node): raise ValueError(missing(oper(node)) + mark(nodei))

        return Namespace(add_child=add_child, add_implicit=add_implicit, add_node=add_node,
                         make_val=make_val, finished=finished, parse_op=parse_op,
                         stack_push=stack.append, stack_pop=stack_pop, validate=validate)

class BooleanResult(object):
    """
    Accumulative result of boolean expression evaluation, tracking value contribution.

    Each instance carries the final boolean result, all operand values accumulated so far,
    and for each operand a flag: True if operand contributes positively to the result,
    False if it contributes in inverted form, None if it does not contribute.
    Iterating the instance yields operands flagged as True.
    """


    def __init__(self, value=Ellipsis, terminal=None, **__props):
        """
        @param   value     operand value to populate instance with, if any
        @param   terminal  callback(value) to evaluate operand with, if not using value directly
        @param   __props   internal attributes to set directly, as `result`, `values`, `actives`
        """
        self._result  = Ellipsis  # Final accumulated result of expression
        self._values  = []        # All accumulated operands
        self._actives = []        # For each operand, True/False/None
        for name in __props:
            setattr(self, "_" + name, __props[name])
        if value is not Ellipsis:
            self.set(value, terminal)


    def set(self, value, terminal=None):
        """Sets value to instance, using terminal callback for evaluation if given."""
        evaluated = terminal(value) if terminal else value
        self._result = bool(evaluated)
        self._values = [value]
        self._actives = [True if self._result else None]


    def __iter__(self):
        """Yields active values: contributing to true result positively."""
        for operand, active in zip(self._values, self._actives):
            if active:
                yield operand


    def __bool__(self):
        """Returns accumulated result (Py3 truth value hook)."""
        return self._result


    def __nonzero__(self):
        """Returns accumulated result (Py2 truth value hook)."""
        return self._result


    def __eq__(self, other):
        """Returns whether result equals given boolean, or whether other is this instance."""
        if isinstance(other, bool):
            return bool(self) is other
        return self is other


    @classmethod
    def and_(cls, a, b):
        """Returns new BooleanResult as a and b."""
        flags = []
        for operand, counterpart in ((a, b), (b, a)):
            for flag in operand._actives:  # Operand flags stay on only if other side is true
                flags.append(flag if counterpart else None)
        return cls(result=bool(a and b), values=a._values + b._values, actives=flags)


    @classmethod
    def or_(cls, a, b, eager=False):
        """Returns new BooleanResult as a or b."""
        flags = list(a._actives)
        for flag in b._actives:  # Second operand contributes only if eager or first is false
            flags.append(flag if eager or not a else None)
        return cls(result=bool(a or b), values=a._values + b._values, actives=flags)


    @classmethod
    def not_(cls, a):
        """Returns new BooleanResult as not a."""
        flags = []
        for flag in a._actives:  # Invert contributing flags, leave inactive as is
            flags.append(None if flag is None else not flag)
        return cls(result=not a, values=a._values, actives=flags)


# Public names of the module, exported on wildcard import
__all__ = ["BooleanResult", "ExpressionTree", "Scanner"]

grepros.api.Bag
Bag factory metaclass.
Definition api.py:381

grepros.common.MatchMarkers
Highlight markers for matches in message values.
Definition common.py:50

grepros.inputs.AppSource
Produces messages from iterable or pushed data.
Definition inputs.py:1276

grepros.inputs.BagSource
Produces messages from ROS bagfiles.
Definition inputs.py:522

grepros.inputs.Source
Message producer base class.
Definition inputs.py:35

grepros.outputs.Sink
Output base class.
Definition outputs.py:32

grepros.search.BooleanResult
Accumulative result of boolean expression evaluation, tracking value contribution.
Definition search.py:787

grepros.search.BooleanResult.or_
or_(cls, a, b, eager=False)
Returns new BooleanResult as a or b.
Definition search.py:817

grepros.search.BooleanResult.not_
not_(cls, a)
Returns new BooleanResult as not a.
Definition search.py:823

grepros.search.BooleanResult.and_
and_(cls, a, b)
Returns new BooleanResult as a and b.
Definition search.py:811

grepros.search.ExpressionTree
Parses and evaluates operator expressions like "a AND (b OR NOT c)".
Definition search.py:579

grepros.search.ExpressionTree.UNARIES
tuple UNARIES
Definition search.py:587

grepros.search.ExpressionTree.FORMAT_TEMPLATES
dict FORMAT_TEMPLATES
Definition search.py:593

grepros.search.ExpressionTree.configure
configure(self, **props)
Overrides instance configuration.
Definition search.py:610

grepros.search.ExpressionTree.__init__
__init__(self, **props)
Definition search.py:600

grepros.search.ExpressionTree.VAL
VAL
Definition search.py:583

grepros.search.ExpressionTree.LBRACE
LBRACE
Definition search.py:581

grepros.search.ExpressionTree.IMPLICIT
IMPLICIT
Definition search.py:586

grepros.search.ExpressionTree.OPERATORS
dict OPERATORS
Definition search.py:589

grepros.search.ExpressionTree.RBRACE
RBRACE
Definition search.py:581

grepros.search.ExpressionTree.ESCAPE
ESCAPE
Definition search.py:581

grepros.search.ExpressionTree.SEPARATORS
SEPARATORS
Definition search.py:582

grepros.search.ExpressionTree.BINARIES
tuple BINARIES
Definition search.py:588

grepros.search.ExpressionTree.SHORTCIRCUITS
dict SHORTCIRCUITS
Definition search.py:592

grepros.search.ExpressionTree.evaluate
evaluate(self, tree, terminal=None, eager=())
Returns result of evaluating expression tree.
Definition search.py:626

grepros.search.ExpressionTree.QUOTES
QUOTES
Definition search.py:581

grepros.search.ExpressionTree.parse
parse(self, text, terminal=None)
Returns an operator expression like "a AND (b OR NOT c)" parsed into a binary tree.
Definition search.py:669

grepros.search.ExpressionTree.RANKS
dict RANKS
Definition search.py:590

grepros.search.ExpressionTree.format
format(self, tree, terminal=None)
Returns expression tree formatted as string.
Definition search.py:647

grepros.search.ExpressionTree.VOID
VOID
Definition search.py:594

grepros.search.ExpressionTree.CASED
bool CASED
Definition search.py:585

grepros.search.Scanner._patterns
_patterns
Definition search.py:98

grepros.search.Scanner.validate
validate(self, reset=False)
Returns whether conditions have valid syntax, prints errors.
Definition search.py:210

grepros.search.Scanner.source
source
Source instance.
Definition search.py:120

grepros.search.Scanner.__init__
__init__(self, args=None, **kwargs)
Definition search.py:96

grepros.search.Scanner.work
work(self, source, sink)
Greps messages yielded from source and emits matched content to sink.
Definition search.py:196

grepros.search.Scanner.find
find(self, source, highlight=None)
Yields matched and context messages from source.
Definition search.py:143

grepros.search.Scanner.valid
valid
Result of validate()
Definition search.py:124

grepros.search.Scanner.__exit__
__exit__(self, exc_type, exc_value, traceback)
Context manager exit, does nothing.
Definition search.py:241

grepros.search.Scanner.args
args
Definition search.py:127

grepros.search.Scanner.__enter__
__enter__(self)
Context manager entry, does nothing, returns self.
Definition search.py:236

grepros.search.Scanner.args0
args0
Definition search.py:126

grepros.search.Scanner.sink
sink
Sink instance.
Definition search.py:122

grepros.search.Scanner.GrepMessage
GrepMessage
Namedtuple of (topic name, ROS message, ROS time object, message if matched, index in topic).
Definition search.py:39

grepros.search.Scanner.match
match(self, topic, msg, stamp, highlight=None)
Returns matched message if message matches search filters.
Definition search.py:162

grepros.search.Scanner.get_match
get_match(self, msg)
Returns transformed message if all patterns find a match in message, else None.
Definition search.py:472

grepros.search.Scanner.ANY_MATCHES
list ANY_MATCHES
Match patterns for global any-match.
Definition search.py:42