# Copyright 2013 Dean Gardiner # # Licensed under the Apache License, Version 2.0 (the "License"); # you may not use this file except in compliance with the License. # You may obtain a copy of the License at # # http://www.apache.org/licenses/LICENSE-2.0 # # Unless required by applicable law or agreed to in writing, software # distributed under the License is distributed on an "AS IS" BASIS, # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. # See the License for the specific language governing permissions and # limitations under the License. from logr import Logr class CaptureStep(object): REPR_KEYS = ['regex', 'func', 'single'] def __init__(self, capture_group, tag, source, regex=None, func=None, single=None): #: @type: CaptureGroup self.capture_group = capture_group #: @type: str self.tag = tag #: @type: str self.source = source #: @type: str self.regex = regex #: @type: function self.func = func #: @type: bool self.single = single def _get_next_subject(self, parser): if self.source == 'fragment': if not parser.fragment_available(): return None return parser.next_fragment() elif self.source == 'closure': if not parser.closure_available(): return None return parser.next_closure() raise NotImplementedError() def execute(self, fragment): if self.regex: weight, match, num_fragments = self.capture_group.parser.matcher.fragment_match(fragment, self.regex) Logr.debug('(execute) [regex] tag: "%s"', self.tag) if match: return True, weight, match, num_fragments elif self.func: match = self.func(fragment) Logr.debug('(execute) [func] %s += "%s"', self.tag, match) if match: return True, 1.0, match, 1 else: Logr.debug('(execute) [raw] %s += "%s"', self.tag, fragment.value) return True, 1.0, fragment.value, 1 return False, None, None, 1 def __repr__(self): attribute_values = [key + '=' + repr(getattr(self, key)) for key in self.REPR_KEYS if hasattr(self, key) and getattr(self, key)] attribute_string = ', ' + ', '.join(attribute_values) if len(attribute_values) > 0 else '' return "CaptureStep('%s'%s)" % (self.tag, attribute_string)