esc-mentoring

added license-analyze. This script checks for consistency between the different license files. Remark, this script controls the requiremnt from gitdm-config, as well as esc-mentoring. But do not check the requirements from the foundation.
author: jan Iversen <jani@documentfoundation.org> 2017-02-01 07:52:42 +0100
committer: jan Iversen <jani@documentfoundation.org> 2017-02-01 07:52:42 +0100
commit: cc88d54feff23c168ee07ca7914cc1eb7fbfedcc (patch)
tree: fde5b094fcfdbcfc470c2e5219d53cc9aed3ce82
parent: bd5992e381753f11164c38cdac70970e98b09f52 (diff)
1 files changed, 252 insertions, 0 deletions
diff --git a/esc-reporting/license-analyze.py b/esc-reporting/license-analyze.py
new file mode 100755
index 0000000..584d5c6
--- /dev/null
+++ b/esc-reporting/license-analyze.py
@@ -0,0 +1,252 @@
+#!/usr/bin/env python3
+#
+# This file is part of the LibreOffice project.
+#
+# This Source Code Form is subject to the terms of the Mozilla Public
+# License, v. 2.0. If a copy of the MPL was not distributed with this
+# file, You can obtain one at http://mozilla.org/MPL/2.0/.
+#
+
+
+
+### DESCRIPTION
+#
+# This program controls the license files:
+# 1) loads aliases, license*, domain-map
+# 2) write sorted versions of aliases (special handling due to ' ' seperator) and license*
+# 3) look for and load wiki.txt
+# 4) check consistency
+# 5) write newwiki.txt with wiki updates
+# 6) write warnings about inconsistences
+#
+
+
+
+import sys
+import csv
+import io
+import os
+import operator
+import datetime
+import collections
+
+
+
+def load_alias(homeDir):
+    rawData = collections.OrderedDict()
+    tmpData = collections.OrderedDict()
+    fileName = homeDir + 'aliases'
+
+    try:
+        with open(fileName, 'r') as fp:
+            for line in fp:
+                line = line[:-1]
+                if line.startswith('#') or line.startswith(' ') or len(line) == 0:
+                    continue
+                if line.startswith('"'):
+                    x = line.index('"', 1)
+                    result = [line[1:x], line[x+2:]]
+                else:
+                    result = line.split(' ')
+                if result[0] in tmpData:
+                    print('>>> aliases ' + result[0] + ' DUPLICATED')
+                if result[1] in tmpData:
+                    print('>>> aliases ' + result[0] + ' Target also alias')
+                if result[0].lower() != result[0]:
+                    print('>>> aliases ' + result[0] + ' Alias contains capital letters')
+                if result[1].lower() != result[1]:
+                    print('>>> aliases ' + result[1] + ' Target contains capital letters')
+                if result[0] == result[1]:
+                    print('>>> aliases ' + result[0] + ' Target == Alias')
+                for i in tmpData:
+                    if result[0] == tmpData[i]:
+                        print('>>> aliases ' + result[0] + ' Alias also target')
+                        break
+                tmpData[result[0]] = result[1]
+        oldTarget = ''
+        doSort = False
+        for entry in tmpData:
+            if tmpData[entry] < oldTarget:
+                doSort = True
+                break
+            oldTarget = tmpData[entry]
+        if doSort:
+            s = [(k, tmpData[k]) for k in sorted(tmpData, key=tmpData.get)]
+            for i in s:
+                rawData[i[0]] = i[1]
+            with open(fileName, 'w') as fp:
+                for entry in rawData:
+                    if ' ' in entry:
+                        print('"' + entry + '" ' + rawData[entry], file=fp)
+                    else:
+                        print(entry + ' ' + rawData[entry], file=fp)
+        else:
+            rawData = tmpData
+    except Exception as e:
+      print('>>> Error load file ' + fileName + ' due to ' + str(e))
+      rawData = None
+    return rawData
+
+
+
+def load_domainmap(homeDir):
+    rawData = []
+    fileName = homeDir + 'domain-map'
+    try:
+        with open(fileName, 'r') as fp:
+            for line in fp:
+                line = line[:-1]
+                if line.startswith('#') or line.startswith(' ') or len(line) == 0:
+                    continue
+                if '\t' in line:
+                    mail = line[:line.index('\t')]
+                else:
+                    mail = line[:line.index(' ')]
+                if '@' in mail and mail not in rawData:
+                    if mail.lower() != mail:
+                        print('>>> domain-map ' + mail + ' mail contains capital letters')
+                    rawData.append(mail)
+    except Exception as e:
+      print('Error load file ' + fileName + ' due to ' + str(e))
+      rawData = None
+    return rawData
+
+
+
+def load_licensePersonal(homeDir):
+    rawData = collections.OrderedDict()
+    fileName = homeDir + 'licensePersonal.csv'
+    orgText = []
+    try:
+        with open(fileName, 'r') as fp:
+            for line in fp:
+                line = line[:-1]
+                orgText.append(line)
+                if line.startswith('#') or line.startswith(' ') or len(line) == 0:
+                    continue
+                data = line.split(';')
+                if data[0].lower() != data[0]:
+                    print('>>> personalLicense.csv ' + data[0] + ' mail contains capital letters')
+                if data[0] in rawData:
+                    print('>>> personalLicense.csv ' + data[0] + ' duplicate')
+                rawData[data[0]] = {'name': data[1], 'license': data[2]}
+        newText = sorted(orgText)
+        if newText != orgText:
+            with open(fileName, 'w') as fp:
+                for line in newText:
+                   print(line, file=fp)
+    except Exception as e:
+      print('Error load file ' + fileName + ' due to ' + str(e))
+      rawData = None
+    return rawData
+
+
+
+def load_wiki(homeDir):
+    rawData = []
+    fileName = homeDir + 'wiki.txt'
+    try:
+        with open(fileName, 'r') as fp:
+            doCollect = 0
+            for line in fp:
+                if not line.startswith('|') or line.startswith('|}'):
+                    continue
+                if line.startswith('|-'):
+                    doCollect = 1
+                    data = {'name': '', 'email': '', 'license': ''}
+                    # Structure:
+                    # 1:    Wiki user name
+                    # 2:    Real name
+                    # 3:    Git email
+                    # 4:    IRC nick
+                    # 5:    Affiliation
+                    # 6:    License
+                elif doCollect in [1,4,5]:
+                    doCollect += 1
+                elif doCollect == 2:
+                    data['name'] = line[2:-1]
+                    doCollect = 3
+                elif doCollect == 3:
+                    x = line[2:-1]
+                    if x.endswith('}}'):
+                        x = x[:-2]
+                    z = x.find('|')
+                    if z > 0:
+                        x = x[z+1:]
+                    x = x.replace('|', '@')
+                    data['email'] = x
+                    doCollect = 4
+                elif doCollect == 6:
+                    x = line[2:-1]
+                    if x.startswith('['):
+                        x = x[1:]
+                    if x.endswith(']'):
+                        x = x[:-1]
+                    data['license'] = x
+                    rawData.append(data)
+                    doCollect = 0
+    except Exception as e:
+      print('Error load file ' + fileName + ' due to ' + str(e))
+      rawData = None
+    return rawData
+
+
+
+def checkConsistency(aliases, domain, license):
+    for dMail in domain:
+        if not dMail in license:
+            print('>>> domain-map ' + dMail + ' not in licensePersonal !')
+        if dMail in aliases:
+            print('>>> domain-map ' + dMail + ' used as aliaes in aliases !')
+    for entry in aliases:
+        if entry in license:
+            print('>>> aliases ' + entry + ' alias is licensed !')
+        if not aliases[entry] in license:
+            print('>>> aliases ' + aliases[entry] + ' target is not licensed !')
+
+
+
+def checkWiki(homedir, license, aliases, wiki):
+    names = {}
+    for i in license:
+        names[license[i]['name']] = i
+    for data in wiki:
+        email = data['email'].lower()
+        if email in aliases:
+            email = aliases[email]
+        if email in license:
+            license[email]['inWiki'] = True
+            continue;
+        if data['name'] in names:
+            license[names[data['name']]]['inWiki'] = True
+            continue;
+        print("wiki entry missing license: " + str(data))
+    todo = {}
+    for i in license:
+        if 'inWiki' not in license[i] and license[i]['license'].startswith('http'):
+            todo[license[i]['name']] = i
+    with open(homedir + 'wiki.new', 'w') as fp:
+        for i in sorted(todo):
+            entry = license[todo[i]]
+            if entry['name'] != 'NO NAME':
+                print('| ', file=fp)
+                print('| ' + entry['name'], file=fp)
+                print('| {{nospam|' + todo[i].replace('@', '|') + '}}', file=fp)
+                print('| ', file=fp)
+                print('| Individual', file=fp)
+                print('| [' + entry['license'] + ']', file=fp)
+                print('|-', file=fp)
+
+def runCompare(homedir):
+    dataAliases = load_alias(homedir)
+    dataDomainMail = load_domainmap(homedir)
+    dataLicenseMail = load_licensePersonal(homedir)
+    dataWiki = load_wiki(homedir)
+
+    checkConsistency(dataAliases, dataDomainMail, dataLicenseMail)
+    checkWiki(homedir, dataLicenseMail, dataAliases, dataWiki)
+    print('all done')
+
+
+if __name__ == '__main__':
+    runCompare('./')
author	jan Iversen <jani@documentfoundation.org>	2017-02-01 07:52:42 +0100
committer	jan Iversen <jani@documentfoundation.org>	2017-02-01 07:52:42 +0100
commit	cc88d54feff23c168ee07ca7914cc1eb7fbfedcc (patch)
tree	fde5b094fcfdbcfc470c2e5219d53cc9aed3ce82
parent	bd5992e381753f11164c38cdac70970e98b09f52 (diff)