bumpver/src/pycalver/parse.py

117 lines
3.1 KiB
Python
Raw Normal View History

2018-09-02 21:48:12 +02:00
# This file is part of the pycalver project
# https://github.com/mbarkhau/pycalver
#
# Copyright (c) 2018 Manuel Barkhau (@mbarkhau) - MIT License
# SPDX-License-Identifier: MIT
import re
import logging
import typing as typ
2018-09-02 23:36:57 +02:00
import pkg_resources
2018-09-02 21:48:12 +02:00
log = logging.getLogger("pycalver.parse")

# Release tags which may follow the build number of a version string,
# e.g. the "beta" in "v201809.0001-beta".
VALID_RELEASE_VALUES = ("alpha", "beta", "dev", "rc", "post")

# Backward compatible alias: the constant was first published under this
# misspelled name, so it is kept for any code which already imports it.
VALID_RELESE_VALUES = VALID_RELEASE_VALUES
2018-09-02 23:36:57 +02:00
# https://regex101.com/r/fnj60p/10
#
# Verbose regular expression for a complete pycalver version string such as
# "v201809.0001-beta". Note that the "build" group includes its "." prefix
# and the "release" group includes its "-" prefix. The version must be
# followed by a whitespace character or by the end of the string.
PYCALVER_PATTERN = r"""
\b
(?P<version>
    (?P<calver>
        v                       # "v" version prefix
        (?P<year>\d{4})
        (?P<month>\d{2})
    )
    (?P<build>
        \.                      # "." build nr prefix
        \d{4,}
    )
    (?P<release>
        \-                      # "-" release prefix
        (?:alpha|beta|dev|rc|post)
    )?
)(?:\s|$)
"""

# re.VERBOSE is required: the pattern above relies on whitespace and
# "#" comments being ignored by the regex compiler.
PYCALVER_RE: typ.Pattern[str] = re.compile(PYCALVER_PATTERN, flags=re.VERBOSE)
# (char, escaped) replacement pairs which are applied, in order, to the
# literal text of a search pattern before it is compiled as a regular
# expression.
#
# - The backslash entry must stay first, otherwise the backslashes added
#   by the later entries would themselves be escaped a second time.
# - Closing brackets and "?" are escaped as well as the opening ones: an
#   unescaped ")" leaves the parentheses of the compiled expression
#   unbalanced (re.error) and an unescaped "?" acts as a quantifier.
# - "{" and "}" are deliberately absent, they delimit the format string
#   placeholders of a pattern.
PATTERN_ESCAPES = [
    ("\u005c", "\u005c\u005c"),
    ("-"     , "\u005c-"),
    ("."     , "\u005c."),
    ("+"     , "\u005c+"),
    ("*"     , "\u005c*"),
    ("?"     , "\u005c?"),
    ("["     , "\u005c["),
    ("]"     , "\u005c]"),
    ("("     , "\u005c("),
    (")"     , "\u005c)"),
]
2018-09-02 21:48:12 +02:00
2018-09-03 09:19:27 +02:00
# NOTE (mb 2018-09-03): These are matchers for the parts which are
#   used in patterns; they are not meant for validation. This means
#   that they may find strings which are not valid pycalver strings
#   when parsed in their full context. For such cases, the patterns
#   should be expanded.
2018-09-02 21:48:12 +02:00
# Regular expression fragments, keyed by the placeholder name which may be
# used in a search pattern (e.g. "{version}" or "{pep440_version}").
RE_PATTERN_PARTS = {
    # PEP 440 normalization separates "dev" and "post" from the build
    # number with a "." (e.g. "201809.1.dev0"), whereas "a", "b" and "rc"
    # follow it directly (e.g. "201809.1b0"), hence the optional "\.".
    # Without it, only the "201809.1" prefix of such a version is matched.
    'pep440_version': r"\d{6}\.[1-9]\d*(?:\.?(a|b|dev|rc|post))?\d*",
    'version'       : r"v\d{6}\.\d{4,}(\-(alpha|beta|dev|rc|post))?",
    'calver'        : r"v\d{6}",
    'build'         : r"\.\d{4,}",
    'release'       : r"(\-(alpha|beta|dev|rc|post))?",
}
class PatternMatch(typ.NamedTuple):
    """A single occurrence of a search pattern in a list of lines."""

    lineno : int  # zero based
    line   : str  # complete text of the line which contains the match
    pattern: str  # the search pattern as it was passed in by the caller
    span   : typ.Tuple[int, int]  # (start, end) offsets of the match in line
    match  : str  # the matched text itself
2018-09-02 21:48:12 +02:00
2018-09-02 23:36:57 +02:00
class VersionInfo(typ.NamedTuple):
    """The component parts of a parsed pycalver version string."""

    pep440_version: str  # str() of the version as parsed by pkg_resources
    version       : str  # the complete version, e.g. "v201809.0001-beta"
    calver        : str  # "v" prefix, year and month, e.g. "v201809"
    year          : str  # four digits
    month         : str  # two digits
    build         : str  # includes the "." prefix, e.g. ".0001"
    release       : typ.Optional[str]  # includes the "-" prefix, None if absent
2018-09-02 23:36:57 +02:00
def parse_version_info(version: str) -> VersionInfo:
    """Parse a pycalver version string into its component parts.

    Args:
        version: A string which starts with a pycalver version,
            e.g. "v201809.0001-beta".

    Returns:
        A VersionInfo with the named groups of PYCALVER_RE plus the
        version as normalized by pkg_resources.

    Raises:
        ValueError: If ``version`` does not start with a valid pycalver
            version string.
    """
    match = PYCALVER_RE.match(version)
    if match is None:
        raise ValueError(f"Invalid pycalver: {version}")

    # Only the validated portion is normalized. PYCALVER_RE accepts any
    # text after a whitespace character which follows the version, so
    # the raw input may carry trailing text that is not part of it.
    pep440_version = str(pkg_resources.parse_version(match.group("version")))
    return VersionInfo(pep440_version=pep440_version, **match.groupdict())
2018-09-02 21:48:12 +02:00
2018-11-06 21:45:33 +01:00
def _iter_pattern_matches(lines: typ.List[str], pattern: str) -> typ.Iterable[PatternMatch]:
    """Yield the first match of ``pattern`` in each line that contains one.

    Args:
        lines: The lines to search.
        pattern: Literal text which may contain format string placeholders
            for the keys of RE_PATTERN_PARTS, e.g. '__version__ = "{version}"'.

    Yields:
        One PatternMatch per matching line, at most one for any given line.
        The ``pattern`` field holds the unmodified argument, not the
        compiled expression.

    As this is a generator, the pattern is only compiled once iteration
    starts, so errors caused by the pattern surface at that point.
    """
    # The pattern is escaped, so that everything besides the format
    # string variables is treated literally.
    pattern_tmpl = pattern
    for char, escaped in PATTERN_ESCAPES:
        pattern_tmpl = pattern_tmpl.replace(char, escaped)

    # Escaping happens before the placeholders are filled in, so that the
    # regular expression fragments themselves are left intact.
    pattern_str = pattern_tmpl.format(**RE_PATTERN_PARTS)
    pattern_re = re.compile(pattern_str)

    for lineno, line in enumerate(lines):
        match = pattern_re.search(line)
        if match:
            yield PatternMatch(lineno, line, pattern, match.span(), match.group(0))
def parse_patterns(lines: typ.List[str], patterns: typ.List[str]) -> typ.List[PatternMatch]:
    """Collect the matches of every pattern in ``lines``.

    Args:
        lines: The lines to search.
        patterns: The search patterns, each is applied to all of the lines.

    Returns:
        All matches, grouped by pattern in the order of ``patterns`` and,
        within a pattern, in the order of ``lines``.
    """
    all_matches: typ.List[PatternMatch] = []
    for pattern in patterns:
        all_matches.extend(_iter_pattern_matches(lines, pattern))
    return all_matches