kallithea Files · scripts/update-copyrights.py

Files @ 11cae16e5a5d

Branch filter:

Location: kallithea/scripts/update-copyrights.py - annotation

11cae16e5a5d 6.4 KiB text/x-python Show Source Show as Raw Download as Raw

mads

setup: use old importlib_metadata version to fix kombu failing on python < 3.8

Many libraries use the importlib_metadata library as a fallback when running on
Python versions older than 3.8. For example, setuptools does so when easy_install
is used to install the Kallithea console_scripts entry points in the bin folder.
The dependencies on importlib_metadata were indirect and without constraints on
the version number.

The problem is that Celery uses Kombu, which (on Python < 3.8) uses
importlib_metadata in a way that is incompatible with importlib_metadata > 5.

Most obviously, building the docs failed with:
Running Sphinx v5.1.1

Configuration error:
There is a programmable error in your configuration file:

Traceback (most recent call last):
File ".../kallithea/venv/lib64/python3.7/site-packages/sphinx/config.py", line 347, in eval_config_file
exec(code, namespace)
File ".../kallithea/docs/conf.py", line 17, in <module>
import kallithea
File ".../kallithea/kallithea/__init__.py", line 45, in <module>
CELERY_APP = celery.Celery() # needed at import time but is lazy and can be configured later
File ".../kallithea/venv/lib64/python3.7/site-packages/celery/local.py", line 492, in __getattr__
[name])
File ".../kallithea/venv/lib64/python3.7/site-packages/celery/app/__init__.py", line 2, in <module>
from celery import _state
File ".../kallithea/venv/lib64/python3.7/site-packages/celery/_state.py", line 15, in <module>
from celery.utils.threads import LocalStack
File ".../kallithea/venv/lib64/python3.7/site-packages/celery/utils/__init__.py", line 16, in <module>
from .nodenames import nodename, nodesplit, worker_direct
File ".../kallithea/venv/lib64/python3.7/site-packages/celery/utils/nodenames.py", line 6, in <module>
from kombu.entity import Exchange, Queue
File ".../kallithea/venv/lib64/python3.7/site-packages/kombu/entity.py", line 7, in <module>
from .serialization import prepare_accept_content
File ".../kallithea/venv/lib64/python3.7/site-packages/kombu/serialization.py", line 440, in <module>
for ep, args in entrypoints('kombu.serializers'): # pragma: no cover
File ".../kallithea/venv/lib64/python3.7/site-packages/kombu/utils/compat.py", line 82, in entrypoints
for ep in importlib_metadata.entry_points().get(namespace, [])
AttributeError: 'EntryPoints' object has no attribute 'get'

That made readthedocs builds fail, because its default web configuration
used Python 3.7.

Fixed by introducing an explicit dependency on importlib_metadata < 5.

aa6f17a53b49
5dde581f703f
5dde581f703f
5dde581f703f
5dde581f703f
5dde581f703f
5dde581f703f
5dde581f703f
5dde581f703f
5dde581f703f
5dde581f703f
5dde581f703f
5dde581f703f
5dde581f703f
5dde581f703f
5dde581f703f
5dde581f703f
5dde581f703f
5dde581f703f
5dde581f703f
5dde581f703f
5dde581f703f
5dde581f703f
5dde581f703f
5dde581f703f
5dde581f703f
5dde581f703f
5dde581f703f
5dde581f703f
5dde581f703f
5dde581f703f
5dde581f703f
5dde581f703f
5dde581f703f
5dde581f703f
5dde581f703f
5dde581f703f
5dde581f703f
5dde581f703f
5dde581f703f
5dde581f703f
5dde581f703f
5dde581f703f
0a277465fddf
96b43734025f
5dde581f703f
5dde581f703f
5dde581f703f
5dde581f703f
5dde581f703f
5dde581f703f
5dde581f703f
5dde581f703f
f9988201a3c4
d6ccf6a9fd11
d6ccf6a9fd11
d6ccf6a9fd11
d6ccf6a9fd11
d6ccf6a9fd11
d6ccf6a9fd11
d6ccf6a9fd11
5dde581f703f
5dde581f703f
5dde581f703f
5dde581f703f
5dde581f703f
5dde581f703f
5dde581f703f
5dde581f703f
5dde581f703f
5dde581f703f
5dde581f703f
5dde581f703f
5dde581f703f
5dde581f703f
5dde581f703f
5dde581f703f
5dde581f703f
5dde581f703f
5dde581f703f
5dde581f703f
5dde581f703f
5dde581f703f
5dde581f703f
5dde581f703f
5dde581f703f
5dde581f703f
5dde581f703f
5dde581f703f
5dde581f703f
5dde581f703f
5dde581f703f
5dde581f703f
5dde581f703f
5dde581f703f
5dde581f703f
5dde581f703f
5dde581f703f
5dde581f703f
5dde581f703f
5dde581f703f
5dde581f703f
5dde581f703f
5dde581f703f
5dde581f703f
27d6f56ade84
27d6f56ade84
27d6f56ade84
5dde581f703f
5dde581f703f
5dde581f703f
5dde581f703f
5dde581f703f
5dde581f703f
5dde581f703f
5dde581f703f
5dde581f703f
665dfa112f2c
5dde581f703f
5dde581f703f
665dfa112f2c
5dde581f703f
5dde581f703f
5dde581f703f
5dde581f703f
5dde581f703f
5dde581f703f
5dde581f703f
050a94de8e7f
5dde581f703f
5dde581f703f
5dde581f703f
5dde581f703f
5dde581f703f
5dde581f703f
5dde581f703f
a44228cd208b
050a94de8e7f
050a94de8e7f
68bbfd164b23
5dde581f703f
5dde581f703f
5dde581f703f
5dde581f703f
5dde581f703f
5dde581f703f
a44228cd208b
050a94de8e7f
050a94de8e7f
68bbfd164b23
5dde581f703f
5dde581f703f
5dde581f703f
5dde581f703f
5dde581f703f
5dde581f703f
5dde581f703f
050a94de8e7f
5dde581f703f
68bbfd164b23
5dde581f703f
5dde581f703f
5dde581f703f
5dde581f703f
f68db0c03a78
f68db0c03a78
f68db0c03a78
f68db0c03a78
f68db0c03a78
f68db0c03a78
68bbfd164b23
f68db0c03a78
66e8dbd4b571
f68db0c03a78
f68db0c03a78
5dde581f703f
5dde581f703f
5dde581f703f
5dde581f703f
5dde581f703f
5dde581f703f
5dde581f703f

#!/usr/bin/env python3
# -*- coding: utf-8 -*-

"""
Kallithea script for maintaining contributor lists from version control
history.

This script and the data in it are a best effort attempt at reverse engineering
previous attributions and correlating them with version control history while
preserving all existing copyright statements and attribution. This script is
processing and summarizing information found elsewhere - it is not by itself
making any claims. Comments in the script are an attempt at reverse engineering
possible explanations - they are not showing any intent or confirming that the
explanations are correct.

Four files are generated / modified by this script:

kallithea/templates/about.html claims to show copyright holders, and the GPL
license requires such existing "legal notices" to be preserved. We also try to
keep it updated with copyright holders, but do not claim it is a correct list.

CONTRIBUTORS has the purpose of giving credit where credit is due and lists all
the contributor names in the source.

kallithea/templates/base/base.html contains the copyright years in the page
footer.

docs/conf.py contains the copyright years in its "copyright" setting.

The two name lists (about.html and CONTRIBUTORS) both make a best effort of
listing all copyright holders, but revision control history might be a better
and more definitive source.

Contributors are sorted "fairly" by copyright year and amount of
contribution.

New contributors are listed, without considering if the contribution contains
copyrightable work.

When the copyright might belong to a different legal entity than the
contributor, the legal entity is given credit too.
"""

import os
import re
from collections import defaultdict

import contributor_data


def sortkey(x):
    """Return the key that orders contributors "fairly".

    x must be a 2-tuple of a list of year strings (oldest first) and the
    contributor name. Entries are ordered by, in turn:
    * latest contribution year, most recent first
    * first contribution year, earliest first
    * number of contribution years, most first
    * lower-cased name, with a few accented letters folded to plain ASCII
    An entry without any years is treated as having the single year '0'.
    """
    year_list, contributor = x
    year_list = year_list or ['0']
    latest = int(year_list[-1])
    earliest = int(year_list[0])
    # Fold the accented letters so such names sort next to their plain
    # spelling.
    folded_name = contributor.lower().translate(
        str.maketrans({'\xe9': 'e', '\u0142': 'l'}))
    return (-latest, earliest, -len(year_list), folded_name)


def nice_years(l, dash='-', join=' '):
    """Convert a sequence of years into a brief range string.

    Runs of consecutive years are collapsed to 'first<dash>last', and the
    resulting pieces are combined with join. With the defaults,
    ['1900', '1901', '1921'] gives '1900-1901 1921'.

    l: sequence of years (strings or ints), expected in ascending order
    dash: string placed between the first and last year of a range
    join: string placed between the ranges
    Returns '' for an empty (or None) l.
    """
    years = [int(year) for year in l or ()]
    if not years:
        return ''
    ranges = []
    start = end = years[0]
    for year in years[1:]:
        if year == end + 1:
            # Still in the same run of consecutive years.
            end = year
            continue
        # The run ended - emit it and start a new one at this year.
        if start == end:
            ranges.append('%s' % start)
        else:
            ranges.append('%s%s%s' % (start, dash, end))
        start = end = year
    # Emit the final run explicitly instead of relying on a sentinel value.
    if start == end:
        ranges.append('%s' % start)
    else:
        ranges.append('%s%s%s' % (start, dash, end))
    return join.join(ranges)


def insert_entries(
        filename,
        all_entries,
        no_entries,
        domain_extra,
        split_re,
        normalize_name,
        format_f):
    """Update file with contributor information.

    The part of the file matched by split_re is replaced with one formatted
    entry per normalized name, ordered with sortkey.

    filename: path of the file to rewrite in place (read and written as UTF-8)
    all_entries: list of tuples with year and name
    no_entries: set of names or name and year tuples to ignore
    domain_extra: map domain name to extra credit name
    split_re: regexp matching the part of file to rewrite; it must match
        exactly once
    normalize_name: function to normalize names for grouping and display
    format_f: function formatting year list and name to a string

    Raises ValueError if split_re does not split the file content into
    exactly two parts. The file is not modified in that case.
    """
    name_years = defaultdict(set)

    for year, name in all_entries:
        if name in no_entries or (name, year) in no_entries:
            continue
        # Lower-case everything after ' <' (the address part of
        # 'Name <address>') before grouping.
        parts = name.split(' <', 1)
        if len(parts) == 2:
            name = parts[0] + ' <' + parts[1].lower()
        domain = name.split('@', 1)[-1].rstrip('>')
        if domain in domain_extra:
            # Also credit the extra name registered for this domain.
            name_years[domain_extra[domain]].add(year)
        name_years[normalize_name(name)].add(year)

    # Falsy years (entries without a year) still create an entry for the
    # name but are left out of its year list.
    entries = [(sorted(year for year in years if year), name)
               for name, years in name_years.items()]
    entries.sort(key=sortkey)

    with open(filename, encoding='utf-8') as f:
        content = f.read()

    pieces = re.split(split_re, content)
    if len(pieces) != 2:
        raise ValueError(
            'expected %r to split %s in 2 parts, got %s'
            % (split_re, filename, len(pieces)))
    pre, post = pieces

    # Build the complete new content before opening the file for writing, so
    # a failure while formatting cannot leave the file truncated.
    new_content = (pre +
                   ''.join(format_f(years, name) for years, name in entries) +
                   post)

    with open(filename, 'w', encoding='utf-8') as f:
        f.write(new_content)


def main():
    """Regenerate the contributor and copyright information files.

    Collects a (year, author) pair from "hg log" for every changeset in the
    revset '::.', applies contributor_data.name_fixes to the author names,
    and rewrites the matching sections of kallithea/templates/about.html,
    CONTRIBUTORS, kallithea/templates/base/base.html and docs/conf.py.

    The file names are relative, so the script has to be run from the
    directory that contains them.

    Raises subprocess.CalledProcessError if hg exits with an error, so that
    the files are not rewritten from incomplete history.
    """
    import subprocess  # only needed here; keeps this change self-contained

    # Run hg directly with an argument list (no shell) and fail loudly if it
    # does not succeed.
    hg_output = subprocess.check_output(
        ['hg', 'log', '-r', '::.', '-T', '{date(date,"%Y")} {author}\n'],
        universal_newlines=True)

    def fix_name(name):
        # Look up the full author string first, then just the part before
        # the last '<'; fall back to the name as recorded.
        return (contributor_data.name_fixes.get(name)
                or contributor_data.name_fixes.get(name.rsplit('<', 1)[0].strip())
                or name)

    repo_entries = []
    for line in hg_output.split('\n'):
        line = line.strip()
        if not line:
            # E.g. the empty string after the final newline.
            continue
        year, name = line.split(' ', 1)
        repo_entries.append((year, fix_name(name)))

    insert_entries(
        filename='kallithea/templates/about.html',
        all_entries=repo_entries + contributor_data.other_about + contributor_data.other,
        no_entries=contributor_data.no_about,
        domain_extra=contributor_data.domain_extra,
        split_re=r'(?:  <li>Copyright &copy; [^\n]+</li>\n)+',
        normalize_name=lambda name: name.split('<', 1)[0].strip(),
        format_f=lambda years, name: '  <li>Copyright &copy; %s, %s</li>\n' % (nice_years(years, '&ndash;', ', '), name),
        )

    insert_entries(
        filename='CONTRIBUTORS',
        all_entries=repo_entries + contributor_data.other_contributors + contributor_data.other,
        no_entries=contributor_data.total_ignore,
        domain_extra=contributor_data.domain_extra,
        split_re=r'(?:    [^\n]+\n)+',
        normalize_name=lambda name: name,
        format_f=lambda years, name: ('    %s%s%s\n' % (name, ' ' if years else '', nice_years(years))),
        )

    # All names are normalized to '' so the years of all contributors are
    # merged into a single entry.
    insert_entries(
        filename='kallithea/templates/base/base.html',
        all_entries=repo_entries,
        no_entries=contributor_data.total_ignore,
        domain_extra={},
        split_re=r'(?<=&copy;) .+ (?=by various authors)',
        normalize_name=lambda name: '',
        format_f=lambda years, name: ' ' + nice_years(years, '&ndash;', ', ') + ' ',
        )

    # The regexp expects docs/conf.py to contain a line like:
    # copyright = '2010-2016 by various authors, licensed as GPLv3.'
    insert_entries(
        filename='docs/conf.py',
        all_entries=repo_entries,
        no_entries=contributor_data.total_ignore,
        domain_extra={},
        split_re=r"(?<=copyright = ').+(?= by various authors)",
        normalize_name=lambda name: '',
        format_f=lambda years, name: nice_years(years, '-', ', '),
        )


# Only rewrite the files when executed as a script, not when imported.
if __name__ == '__main__':
    main()


# To list new contributors since last tagging:
# { hg log -r '::tagged()' -T '    {author}\n    {author}\n'; hg log -r '::.' -T '    {author}\n' | sort | uniq; } | sort | uniq -u