17 Commits
0.1.0 ... 0.2.0

Author SHA1 Message Date
ddfd96193d fix setup.cfg 2021-04-18 22:14:12 -07:00
dc5cc2ddd9 Release 0.2.0 2021-04-18 22:07:17 -07:00
57542e228e Update CHANGELOG.md 2021-04-18 22:04:22 -07:00
13ddc5a1f9 Gracefully handle H2s that dont match the schema 2021-04-18 22:01:31 -07:00
98c21e4078 Cleanup unused code 2021-04-18 20:10:03 -07:00
fb35ad3b29 Fix link parsing 2021-04-18 20:02:50 -07:00
849438a5f5 reworked 2-step parser that can handle setext headers 2021-04-18 18:45:39 -07:00
fa97e9154b Fix paragraph separation 2021-04-18 17:11:09 -07:00
f6f7a8b500 README formatting 2021-04-18 17:10:52 -07:00
7b694bc3c0 Add logo to readme 2021-04-18 17:01:21 -07:00
2e2a5834e6 Add logo 2021-04-18 16:57:55 -07:00
fbdd3f8971 code block support, kind-of 2021-04-18 12:36:27 -07:00
9ee8096e33 Improved parsing and add write() method
Tool now has round-trip accuracy with test file!
2021-04-18 03:02:33 -07:00
b5c4a1757e better version header formatting 2021-04-18 00:25:24 -07:00
1b263ad38f Copyright comment 2021-04-18 00:25:05 -07:00
a900679eb6 Fix python_requires tag 2021-04-17 21:53:16 -07:00
c999822bd0 Add changelog link 2021-04-17 00:29:13 -07:00
5 changed files with 226 additions and 82 deletions

View File

@ -1,9 +1,24 @@
# Changelog
All notable changes to this project will be documented in this file.
## 0.2.0
### Added
- New yak log logo drawn by my sister
### Changed
- Updated package metadata
- Rewrote parser to use a 2-step method that is more flexible.
- Parser can now handle code blocks.
- Parser can now handle setext-style headers and H2s not conforming to the
schema.
## 0.1.0 - 2021-04-16
First release
### Added
- `yaclog.read()` method to parse changelog files

View File

@ -1,2 +1,6 @@
# yet-another-changelog
# Yaclog
Yet another changelog command line tool
![a yak who is a log](https://github.com/drewcassidy/yaclog/raw/main/logo.png)
*Logo by Erin Cassidy*

BIN
logo.png Normal file

Binary file not shown.

After

Width:  |  Height:  |  Size: 11 KiB

View File

@ -7,7 +7,6 @@ license = AGPLv3
license_file = LICENSE.md
long_description = file: README.md
long_description_content_type = text/markdown
url = https://github.com/drewcassidy/yet-another-changelog
keywords = changelog, commandline, markdown
classifiers =
@ -23,7 +22,11 @@ classifiers =
Topic :: Software Development :: Version Control :: Git
Topic :: Utilities
project_urls =
Source Code = https://github.com/drewcassidy/yaclog
Changelog = https://github.com/drewcassidy/yaclog/blob/main/CHANGELOG.md
[options]
install_requires = Click; GitPython
python_requires >= 3.8
python_requires = >= 3.8
packages = find:

View File

@ -1,3 +1,19 @@
# yaclog: yet another changelog tool
# Copyright (c) 2021. Andrew Cassidy
#
# This program is free software: you can redistribute it and/or modify
# it under the terms of the GNU Affero General Public License as
# published by the Free Software Foundation, either version 3 of the
# License, or (at your option) any later version.
#
# This program is distributed in the hope that it will be useful,
# but WITHOUT ANY WARRANTY; without even the implied warranty of
# MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
# GNU Affero General Public License for more details.
#
# You should have received a copy of the GNU Affero General Public License
# along with this program. If not, see <https://www.gnu.org/licenses/>.
import datetime
import os
import re
@ -7,6 +23,13 @@ from typing import List, Tuple, Optional
# characters that may start a bullet point
bullets = '+-*'
# bracket characters
brackets = '[]'

# line-oriented patterns used to classify each line of a markdown changelog

# a line starting with three backticks opens or closes a code block
code_regex = re.compile(r'^```')
# a '#'-prefixed header: one or more hashes, whitespace, then contents that
# contain no '#', optionally followed by a closing run of hashes
header_regex = re.compile(r'^(?P<hashes>#+)\s+(?P<contents>[^#]+)(?:\s+#+)?$')
# a line made only of '=' (plus trailing whitespace): setext-style H1 underline
under1_regex = re.compile(r'^=+\s*$')
# a line made only of '-' (plus trailing whitespace): setext-style H2 underline
under2_regex = re.compile(r'^-+\s*$')
# a line whose first character is '-', '+' or '*'
bullet_regex = re.compile(r'^[-+*]')
# a link definition in the form '[id]: link'
linkid_regex = re.compile(r'^\[(?P<link_id>\S*)]:\s*(?P<link>.*)')
def _strip_link(token):
if link_literal := re.fullmatch(r'\[(.*?)]\((.*?)\)', token):
@ -20,6 +43,22 @@ def _strip_link(token):
return token, None, None
def _join_markdown(segments: List[str]) -> str:
    """Join markdown segments into a single string.

    Segments are separated by a blank line, except that consecutive
    single-line bullet items are placed on adjacent lines. Leading and
    trailing whitespace is stripped from the joined result.

    :param segments: the markdown segments to join, in order
    :return: the joined markdown text
    """
    lines: List[str] = []
    prev_was_bullet = False

    for chunk in segments:
        # only a one-line segment that starts with a bullet character
        # is treated as a list item
        single_line_bullet = bool(bullet_regex.match(chunk)) and '\n' not in chunk

        # insert a blank separator unless this item directly continues a list
        if not (single_line_bullet and prev_was_bullet):
            lines.append('')

        lines.append(chunk)
        prev_was_bullet = single_line_bullet

    return '\n'.join(lines).strip()
class VersionEntry:
def __init__(self):
self.sections = {'': []}
@ -27,17 +66,24 @@ class VersionEntry:
self.date: Optional[datetime.date] = None
self.tags: List[str] = []
self.link: str = ''
self.link_id: str = None
self.line_no: int = -1
def __str__(self) -> str:
if self.name.lower() == 'unreleased':
return f'## {self.name}'
if self.link:
segments = [f'[{self.name}]']
else:
segments = [self.name]
date_str = self.date.isoformat() if self.date else 'UNKNOWN'
line = f'## {self.name} - {date_str}'
for tag in self.tags:
line += ' [' + tag.upper() + ']'
if self.date or len(self.tags) > 0:
segments.append('-')
return line
if self.date:
segments.append(self.date.isoformat())
segments += [f'[{t.upper()}]' for t in self.tags]
return ' '.join(segments)
class Changelog:
@ -45,92 +91,168 @@ class Changelog:
self.path = path
self.header = ''
self.versions = []
# Read file
with open(path, 'r') as fp:
self.lines = fp.readlines()
section = ''
in_block = False
in_code = False
self.links = {}
with open(path, 'r') as fp:
# Read file
line = fp.readline()
while line and not line.startswith('##'):
self.header += line
line = fp.readline()
links = {}
segments: List[Tuple[int, List[str], str]] = []
header_segments = []
version = None
section = ''
last_line = ''
for line_no, line in enumerate(self.lines):
if in_code:
# this is the contents of a code block
segments[-1][1].append(line)
if code_regex.match(line):
in_code = False
in_block = False
while line:
if line.isspace():
# skip empty lines
pass
elif match := re.fullmatch(
r'^##\s+(?P<name>\S*)(?:\s+-\s+(?P<date>\S+))?\s*?(?P<extra>.*?)\s*#*$', line):
# this is a version header in the form '## Name (- date) (tags*) (#*)'
version = VersionEntry()
section = ''
elif code_regex.match(line):
# this is the start of a code block
in_code = True
segments.append((line_no, [line], 'code'))
version.name, version.link, version.link_id = _strip_link(match['name'])
elif under1_regex.match(line) and in_block and len(segments[-1][1]) == 1 and segments[-1][2] == 'p':
# this is an underline for a setext-style H1
# ugly but it works
last = segments.pop()
segments.append((last[0], last[1] + [line], 'h1'))
if match['date']:
elif under2_regex.match(line) and in_block and len(segments[-1][1]) == 1 and segments[-1][2] == 'p':
# this is an underline for a setext-style H2
# ugly but it works
last = segments.pop()
segments.append((last[0], last[1] + [line], 'h2'))
elif bullet_regex.match(line):
in_block = True
segments.append((line_no, [line], 'li'))
elif match := header_regex.match(line):
# this is a header
kind = f'h{len(match["hashes"])}'
segments.append((line_no, [line], kind))
in_block = False
elif match := linkid_regex.match(line):
# this is a link definition in the form '[id]: link', so add it to the link table
links[match['link_id'].lower()] = match['link']
elif line.isspace():
# skip empty lines
in_block = False
elif in_block:
# this is a line to be added to a paragraph
segments[-1][1].append(line)
else:
# this is a new paragraph
in_block = True
segments.append((line_no, [line], 'p'))
for segment in segments:
text = ''.join(segment[1]).strip()
if segment[2] == 'h2':
# start of a version
slug = text.rstrip('-').strip('#').strip()
split = slug.split()
if '-' in split:
split.remove('-')
version = VersionEntry()
section = ''
version.name = slug
version.line_no = segment[0]
tags = []
date = []
for word in split[1:]:
if match := re.match(r'\d{4}-\d{2}-\d{2}', word):
# date
try:
version.date = datetime.date.fromisoformat(match['date'].strip(string.punctuation))
date = datetime.date.fromisoformat(match[0])
except ValueError:
version.date = None
if match['extra']:
version.tags = [s.strip('[]') for s in re.findall(r'\[.*?]', match['extra'])]
self.versions.append(version)
elif match := re.fullmatch(r'###\s+(\S*?)(\s+#*)?', line):
# this is a version section header in the form '### Name' or '### Name ###'
section = match[1].title()
if section not in version.sections.keys():
version.sections[section] = []
elif match := re.fullmatch(r'\[(\S*)]:\s*(\S*)\n', line):
# this is a link definition in the form '[id]: link', so add it to the link table
self.links[match[1].lower()] = match[2]
elif line[0] in bullets or last_line.isspace():
# bullet point or new paragraph
# bullet points are preserved since some people like to use '+', '-' or '*' for different things
version.sections[section].append(line.strip())
break
elif match := re.match(r'^\[(?P<tag>\S*)]', word):
tags.append(match['tag'])
else:
break
else:
# not a bullet point, and no whitespace on last line, so append to the last entry
version.sections[section][-1] += '\n' + line.strip()
# matches the schema
version.name, version.link, version.link_id = _strip_link(split[0])
version.date = date
version.tags = tags
last_line = line
line = fp.readline()
self.versions.append(version)
elif len(self.versions) == 0:
# we haven't encountered any version headers yet,
# so it's best to just add this line to the header string
header_segments.append(text)
elif segment[2] == 'h3':
# start of a version section
section = text.strip('#').strip()
if section not in self.versions[-1].sections.keys():
self.versions[-1].sections[section] = []
else:
# change log entry
self.versions[-1].sections[section].append(text)
# handle links
for version in self.versions:
if match := re.fullmatch(r'\[(.*)]', version.name):
# ref-matched link
link_id = match[1].lower()
if link_id in links:
version.link = links.pop(link_id)
version.link_id = None
version.name = match[1]
elif version.link_id in links:
# id-matched link
version.link = links.pop(version.link_id)
# strip whitespace from header
self.header = _join_markdown(header_segments)
self.links = links
def write(self, path: os.PathLike = None):
if path is None:
path = self.path
v_links = {}
v_links.update(self.links)
with open(path, 'w') as fp:
fp.write(self.header)
fp.write('\n\n')
for version in self.versions:
# handle links
if match := re.fullmatch(r'\[(.*)]', version.name):
# ref-matched link
link_id = match[1].lower()
if link_id in self.links:
version.link = self.links.pop(link_id)
version.link_id = None
version.name = match[1]
fp.write(f'## {version}\n\n')
elif version.link_id in self.links:
# id-matched link
version.link = self.links.pop(version.link_id)
if version.link:
v_links[version.name] = version.link
for section in version.sections:
if section:
fp.write(f'### {section}\n\n')
def read_version_header(line: str) -> Tuple[str, datetime.date, List[str]]:
split = line.removeprefix('##').strip().split()
name = split[0]
date = datetime.date.fromisoformat(split[2]) if len(split) > 2 else None
tags = [s.removeprefix('[').removesuffix(']') for s in split[3:]]
if len(version.sections[section]) > 0:
fp.write(_join_markdown(version.sections[section]))
fp.write('\n\n')
return name, date, tags
def write_version_header(name: str, date: datetime.date, tags=None) -> str:
line = f'## {name} - {date.isoformat()}'
if tags:
for tag in tags:
line += ' [' + tag.upper() + ']'
return line
for link_id, link in v_links.items():
fp.write(f'[{link_id.lower()}]: {link}\n')