本文整理汇总了Python中regex.MULTILINE属性的典型用法代码示例。如果您正苦于以下问题:Python regex.MULTILINE属性的具体用法?Python regex.MULTILINE怎么用?Python regex.MULTILINE使用的例子?那么,这里精选的属性代码示例或许可以为您提供帮助。您也可以进一步了解该属性所在模块regex的用法示例。
在下文中一共展示了regex.MULTILINE属性的11个代码示例,这些例子默认根据受欢迎程度排序。您可以为喜欢或者感觉有用的代码点赞,您的评价将有助于系统推荐出更棒的Python代码示例。
示例1: __init__
# 需要导入模块: import regex [as 别名]
# 或者: from regex import MULTILINE [as 别名]
def __init__(self, **kwargs):
    """Compile the tokenizer pattern and read the tokenizer options.

    Args:
        annotators: None or empty set (only tokenizes).
        substitutions: if true, normalizes some token types (e.g. quotes).
    """
    # One named alternative per token class. Every group uses the
    # (?P<name>...) spelling so the pattern is uniform.
    self._regexp = regex.compile(
        '(?P<digit>%s)|(?P<title>%s)|(?P<abbr>%s)|(?P<neg>%s)|(?P<hyph>%s)|'
        '(?P<contr1>%s)|(?P<alphanum>%s)|(?P<contr2>%s)|(?P<sdquote>%s)|'
        '(?P<edquote>%s)|(?P<ssquote>%s)|(?P<esquote>%s)|(?P<dash>%s)|'
        '(?P<ellipses>%s)|(?P<punct>%s)|(?P<nonws>%s)' %
        (self.DIGIT, self.TITLE, self.ABBRV, self.NEGATION, self.HYPHEN,
         self.CONTRACTION1, self.ALPHA_NUM, self.CONTRACTION2,
         self.START_DQUOTE, self.END_DQUOTE, self.START_SQUOTE,
         self.END_SQUOTE, self.DASH, self.ELLIPSES, self.PUNCT,
         self.NON_WS),
        flags=regex.IGNORECASE | regex.UNICODE | regex.MULTILINE
    )
    # Truthiness check instead of len(): an explicit annotators=None is a
    # documented input and must not raise TypeError.
    annotators = kwargs.get('annotators')
    if annotators:
        logger.warning('%s only tokenizes! Skipping annotators: %s',
                       type(self).__name__, annotators)
    # This tokenizer never annotates, whatever was requested.
    self.annotators = set()
    self.substitutions = kwargs.get('substitutions', True)
示例2: extract_ipv4
# 需要导入模块: import regex [as 别名]
# 或者: from regex import MULTILINE [as 别名]
def extract_ipv4(data):
    """Return every valid dotted-quad IPv4 address found in ``data``.

    Candidates are located with a regular expression and then validated
    with ``ipaddress.ip_address``; candidates it rejects (for example an
    octet above 255) are dropped.

    Args:
        data: Text to scan.

    Returns:
        A list of address strings in order of appearance. Duplicates are
        kept.
    """
    # The digit look-arounds stop a candidate from starting or ending in the
    # middle of a longer digit run, so "1234.1.1.1" does not yield
    # "234.1.1.1". Being zero-width, they also consume no neighbouring
    # characters.
    regexp = re.compile(
        r'(?<!\d)(\d{1,3}\.\d{1,3}\.\d{1,3}\.\d{1,3})(?!\d)',
        flags=re.MULTILINE,
    )
    result = []
    for m in regexp.finditer(data):
        candidate = m.group(1)
        try:
            # Used purely as a validator; the parsed object is discarded.
            ipaddress.ip_address(candidate)
        except ValueError:
            continue
        result.append(candidate)
    return result
示例3: regex_match_score
# 需要导入模块: import regex [as 别名]
# 或者: from regex import MULTILINE [as 别名]
def regex_match_score(prediction, pattern):
    """Check if the prediction matches the given regular expression.

    The pattern is compiled case-insensitively and applied with ``match``,
    so it must match starting at the first character of ``prediction``.

    Args:
        prediction: Text to test.
        pattern: Regular expression source.

    Returns:
        True if the pattern matches at the start of ``prediction``; False if
        it does not match or the pattern cannot be compiled.
    """
    try:
        compiled = re.compile(
            pattern,
            flags=re.IGNORECASE | re.UNICODE | re.MULTILINE
        )
    except Exception:
        # Best effort: a bad pattern scores as "no match". Exception rather
        # than BaseException so KeyboardInterrupt/SystemExit still propagate.
        logger.warning('Regular expression failed to compile: %s', pattern)
        return False
    return compiled.match(prediction) is not None
示例4: __init__
# 需要导入模块: import regex [as 别名]
# 或者: from regex import MULTILINE [as 别名]
def __init__(self, **kwargs):
    """Compile the two-alternative tokenizer pattern.

    Args:
        annotators: None or empty set (only tokenizes).
    """
    # Group 1 is the ALPHA_NUM alternative, group 2 the NON_WS alternative.
    self._regexp = regex.compile(
        '(%s)|(%s)' % (self.ALPHA_NUM, self.NON_WS),
        flags=regex.IGNORECASE | regex.UNICODE | regex.MULTILINE
    )
    # Truthiness check instead of len(): an explicit annotators=None is a
    # documented input and must not raise TypeError.
    annotators = kwargs.get('annotators')
    if annotators:
        logger.warning('%s only tokenizes! Skipping annotators: %s',
                       type(self).__name__, annotators)
    # This tokenizer never annotates, whatever was requested.
    self.annotators = set()
示例5: regex_match
# 需要导入模块: import regex [as 别名]
# 或者: from regex import MULTILINE [as 别名]
def regex_match(text, pattern):
    """Test if a regex pattern is contained within a text.

    The pattern is compiled case-insensitively with MULTILINE set and
    applied with ``search``, so it may match anywhere in ``text``.

    Args:
        text: Text to search.
        pattern: Regular expression source.

    Returns:
        True if the pattern is found; False if it is not found or the
        pattern cannot be compiled.
    """
    try:
        compiled = re.compile(
            pattern,
            flags=re.IGNORECASE | re.UNICODE | re.MULTILINE,
        )
    except Exception:
        # Best effort: a bad pattern counts as "not contained". Exception
        # rather than BaseException so KeyboardInterrupt/SystemExit still
        # propagate.
        return False
    return compiled.search(text) is not None
示例6: iter_release_notes
# 需要导入模块: import regex [as 别名]
# 或者: from regex import MULTILINE [as 别名]
def iter_release_notes(repo, from_ref, to_ref, default_role):
    """Yield one release-note line per commit from `from_ref` to `to_ref`.

    Each commit subject is split at its first colon into a tag and a line
    item. The lower-cased tag is looked up in ``KEYWORD_MAP`` (falling back
    to ``default_role``) to choose the role. The issue number is taken from
    the first closing-keyword reference in the commit message, or ``'-'``
    when there is none.
    """
    keywords = '|'.join(GITHUB_CLOSE_KEYWORDS)
    close_ref = re.compile(
        r'^(?:{})\s+#(\d+)\s+from'.format(keywords),
        flags=re.IGNORECASE | re.MULTILINE,
    )
    commits = commits_between(
        repo, from_ref, to_ref, options=pygit2.GIT_SORT_TOPOLOGICAL
    )
    for commit in commits:
        message = commit.message.strip()
        # Only the first line is used; the remaining lines are discarded.
        subject, *_body = map(str.strip, message.splitlines())

        # Without a colon the whole subject serves as both tag and line item.
        head, _sep, tail = subject.partition(':')
        role = KEYWORD_MAP.get(head.lower(), default_role)
        lineitem = tail or subject

        if role == 'bug':
            modifier = ' major'
        else:
            modifier = ''

        # The first reference in the message wins.
        found = close_ref.search(message)
        issue_number = found.group(1) if found else '-'

        yield "* :{role}:`{issue_number}{modifier}` {lineitem}".format(
            role=role,
            issue_number=issue_number,
            modifier=modifier,
            lineitem=lineitem.strip(),
        )
示例7: __init__
# 需要导入模块: import regex [as 别名]
# 或者: from regex import MULTILINE [as 别名]
def __init__(self, **kwargs):
    """Compile the two-alternative tokenizer pattern.

    Args:
        annotators: None or empty set (only tokenizes).
    """
    # Group 1 is the ALPHA_NUM alternative, group 2 the NON_WS alternative.
    self._regexp = regex.compile(
        '(%s)|(%s)' % (self.ALPHA_NUM, self.NON_WS),
        flags=regex.IGNORECASE | regex.UNICODE | regex.MULTILINE,
    )
    # Truthiness check instead of len(): an explicit annotators=None is a
    # documented input and must not raise TypeError.
    annotators = kwargs.get('annotators')
    if annotators:
        logger.warning(
            '%s only tokenizes! Skipping annotators: %s',
            type(self).__name__,
            annotators,
        )
    # This tokenizer never annotates, whatever was requested.
    self.annotators = set()
示例8: __init__
# 需要导入模块: import regex [as 别名]
# 或者: from regex import MULTILINE [as 别名]
def __init__(self, **kwargs):
    """Compile the tokenizer pattern and read the tokenizer options.

    Args:
        annotators: None or empty set (only tokenizes).
        substitutions: if true, normalizes some token types (e.g. quotes).
    """
    # One named alternative per token class. Every group uses the
    # (?P<name>...) spelling so the pattern is uniform.
    self._regexp = regex.compile(
        '(?P<digit>%s)|(?P<title>%s)|(?P<abbr>%s)|(?P<neg>%s)|(?P<hyph>%s)|'
        '(?P<contr1>%s)|(?P<alphanum>%s)|(?P<contr2>%s)|(?P<sdquote>%s)|'
        '(?P<edquote>%s)|(?P<ssquote>%s)|(?P<esquote>%s)|(?P<dash>%s)|'
        '(?P<ellipses>%s)|(?P<punct>%s)|(?P<nonws>%s)'
        % (
            self.DIGIT,
            self.TITLE,
            self.ABBRV,
            self.NEGATION,
            self.HYPHEN,
            self.CONTRACTION1,
            self.ALPHA_NUM,
            self.CONTRACTION2,
            self.START_DQUOTE,
            self.END_DQUOTE,
            self.START_SQUOTE,
            self.END_SQUOTE,
            self.DASH,
            self.ELLIPSES,
            self.PUNCT,
            self.NON_WS,
        ),
        flags=regex.IGNORECASE | regex.UNICODE | regex.MULTILINE,
    )
    # Truthiness check instead of len(): an explicit annotators=None is a
    # documented input and must not raise TypeError.
    annotators = kwargs.get('annotators')
    if annotators:
        logger.warning(
            '%s only tokenizes! Skipping annotators: %s',
            type(self).__name__,
            annotators,
        )
    # This tokenizer never annotates, whatever was requested.
    self.annotators = set()
    self.substitutions = kwargs.get('substitutions', True)
示例9: regex_search
# 需要导入模块: import regex [as 别名]
# 或者: from regex import MULTILINE [as 别名]
def regex_search(
    self,
    pattern: str,
    ignore_case: bool = False,
    multiline: bool = False,
    dotall: bool = False,
    unicode: bool = False,
    extended: bool = False,
):
    """Regex search on current data

    Runs ``re.findall`` over the string form of the current data and stores
    the resulting list in ``self.state``.

    Args:
        pattern (str): Required. The regex pattern to search by
        ignore_case (bool, optional): Set case insensitive flag. Defaults to False.
        multiline (bool, optional): ^/$ match at the start/end of each line. Defaults to False.
        dotall (bool, optional): `.` matches newline. Defaults to False.
        unicode (bool, optional): Match unicode characters. Defaults to False.
        extended (bool, optional): Ignore whitespace in the pattern. Defaults to False.

    Returns:
        Chepy: The Chepy object.

    Examples:
        >>> c = Chepy("loLolololoL")
        >>> c.regex_search("ol", ignore_case=True)
    """
    # Flags are bit masks, so combine them with bitwise OR, not addition.
    flags = 0
    if ignore_case:
        flags |= re.IGNORECASE
    if multiline:
        flags |= re.MULTILINE
    if dotall:
        flags |= re.DOTALL
    if unicode:
        flags |= re.UNICODE
    if extended:
        flags |= re.X
    self.state = re.findall(pattern, self._convert_to_str(), flags=flags)
    return self
示例10: setup_parser
# 需要导入模块: import regex [as 别名]
# 或者: from regex import MULTILINE [as 别名]
def setup_parser():
    """Fill in and compile ``ParsedTextCorrector``'s money-break pattern.

    The keys of ``CURRENCY_SYMBOL_MAP`` are joined into a regex alternation
    (with ``$`` escaped), substituted for the ``symbols`` placeholder of
    ``PATTERN_MONEY_BREAK``, and the result is compiled into
    ``REGEX_MONEY_BREAK``.
    """
    # Imported here rather than at module level, as in the original.
    from lexnlp.extract.en.amounts import CURRENCY_SYMBOL_MAP

    corrector = ParsedTextCorrector
    alternation = '|'.join(CURRENCY_SYMBOL_MAP)
    # Only '$' is escaped; other keys are inserted into the pattern verbatim.
    symbols = alternation.replace('$', r'\$')

    # NOTE(review): the template attribute is overwritten with its formatted
    # result, so a second call would format already-formatted text. Confirm
    # this function runs only once.
    money_pattern = corrector.PATTERN_MONEY_BREAK.format(symbols=symbols)
    corrector.PATTERN_MONEY_BREAK = money_pattern

    regex_flags = (
        re.IGNORECASE | re.DOTALL | re.MULTILINE | re.VERBOSE | re.UNICODE
    )
    corrector.REGEX_MONEY_BREAK = re.compile(money_pattern, regex_flags)
示例11: __init__
# 需要导入模块: import regex [as 别名]
# 或者: from regex import MULTILINE [as 别名]
def __init__(self, pattern, flags=re.UNICODE | re.MULTILINE, name=None):
    """Initialise the base class with ``name`` and compile ``pattern``.

    Args:
        pattern: Regular expression source handed to ``re.compile``.
        flags: Compilation flags. Defaults to ``re.UNICODE | re.MULTILINE``.
        name: Forwarded unchanged to the parent initialiser.
    """
    super(Regex, self).__init__(name)
    compiled = re.compile(pattern, flags=flags)
    # Double-underscore attribute: private to this class.
    self.__pattern = compiled