#!/usr/bin/env python # Licensed to the Apache Software Foundation (ASF) under one or more # contributor license agreements. See the NOTICE file distributed with # this work for additional information regarding copyright ownership. # The ASF licenses this file to You under the Apache License, Version 2.0 # (the "License"); you may not use this file except in compliance with # the License. You may obtain a copy of the License at # # http://www.apache.org/licenses/LICENSE-2.0 # # Unless required by applicable law or agreed to in writing, software # distributed under the License is distributed on an "AS IS" BASIS, # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. # See the License for the specific language governing permissions and # limitations under the License. ''' Purpose: Clutch gathers details about projects currently in incubation. The core resource is the SITE_CONTENT/podlings.xml file. As soon as a project is accepted into incubation, please add its entry. This script reads the SITE_CONTENT/podlings.xml table, and each podling status page, and other resources. The assembled metadata is stored in various data files. See further explanation at http://incubator.apache.org/clutch.html Note: Please keep the dependencies as minimal as possible, so this script can be operated by any Incubator committer. It uses only standard modules. Note: The 'svn log' queries might only run on UNIX, YMMV. 
''' ''' External input data files used: - SITE_CONTENT/podlings.xml URLs http://people.apache.org/~crossley/incubator-keys.txt Created on minotaur using: find /www/www.apache.org/dist/incubator \ -iname "*KEYS*" | grep -v "\.svn\/" > ~/public_html/incubator-keys.txt http://people.apache.org/~crossley/incubator-releases.txt Created on minotaur using: find /www/www.apache.org/dist/incubator \ -iname "*incubat*gz.asc" -o -iname "*incubat*gz.sig" \ -o -iname "*incubat*bz2.asc" -o -iname "*incubat*bz2.sig" \ -o -iname "*incubat*zip.asc" -o -iname "*incubat*zip.sig" \ > ~/public_html/incubator-releases.txt http://people.apache.org/~crossley/incubator-releases-bad-filename.txt Created on minotaur using: find /www/www.apache.org/dist/incubator \ -iname "*gz.asc" -o -iname "*gz.sig" \ -o -iname "*bz2.asc" -o -iname "*bz2.sig" \ -o -iname "*zip.asc" -o -iname "*zip.sig" \ | sed 's/.*\/incubator\///' \ | grep -v incubat \ > ~/public_html/incubator-releases-bad-filename.txt The above has now been replaced by parsing the output of 'svn', 'ls', '-R', 'https://dist.apache.org/repos/dist/release/incubator' asf-authorization-template from Git deployment branch http://mail-archives.apache.org/mod_mbox/ http://www.apache.org/dist/incubator/ http://svn.apache.org/repos/asf/incubator SVN commands 'svn', 'ls', '-R', 'https://dist.apache.org/repos/dist/release/incubator' 'svn', 'ls', '--xml', 'http://svn.apache.org/repos/asf/incubator/' 'svn', 'log', '--xml', 'SITE_CONTENT/projects/{0}.xml' {status file} Output data files created: SITE_CONTENT/clutch.txt SITE_CONTENT/clutcho1.ent SITE_CONTENT/clutcht.ent SITE_CONTENT/clutchr1.ent SITE_CONTENT/clutchr2.ent SITE_CONTENT/clutcho2.ent SITE_CONTENT/clutchm.ent SITE_CONTENT/clutchmy.ent SITE_CONTENT/report_due_1.txt SITE_CONTENT/report_due_2.txt SITE_CONTENT/report_due_3.txt Pickle file: - clutch.pkl (I/O) ''' # FIXME: Mail list detection could be improved. # FIXME: Mail list detection. See svn comments with 2009-11-13 rush bug fix. 
# FIXME: Occasional trailing slash issue in Clutch cache. # FIXME: Some projects use different names in different contexts, and cannot # be automatically handled, e.g. Lucene.Net, log4php (some of their stats # are missing). # See beginning attempt to handle this with "resourceNames". # FIXME: Perhaps send some error reporting to a log file: # - validate the dates. # - detect short description, e.g. Hama = Hama # FIXME: Better/more exception handling, e.g. url open # FIXME: Need various output formats: # - source docs xml file in clutch*.ent (now happening) # - simple text list of project names and basic data clutch.txt (now happening) # - Notation3 or DOAP or RDFa or some such? (not yet) # - python pickle (now happening) # FIXME: Parse Robert's "audit" stuff. # FIXME: Detect if they have SVN repo yet. # - http://svn.apache.org/repos/asf/incubator/* ensure more than ".." # FIXME: Similarly with website. Ensure that there is some content length. # FIXME: Get better hints from Status pages, e.g. sometimes they don't link # to their "tracker" etc. they just use text. # FIXME: News parser gets extra committer if source has commented xml template. # FIXME: Use fragments via other files for the sets of html notes. # FIXME: See some other suggestions on the general@ list. # FIXME: See some other suggestions in clutch.html#notes-2 # FIXME: Better deal with input/output/unicode. # FIXME: See some other suggestions in issue INCUBATOR-78. 
import sys
if sys.version_info < (3, 2):
    raise Exception("Python 3.2 or above is required")

import subprocess
from subprocess import Popen, PIPE
import datetime
from html.parser import HTMLParser
import os.path
import pickle
import pprint
import re
import urllib.request
import urllib.error
import urllib.parse
import xml.dom.minidom
import argparse
import io

# constants for external data ---

# infra moved to github
ASF_AUTH_TEMPLATE = 'https://raw.githubusercontent.com/apache/infrastructure-puppet/deployment/modules/subversion_server/files/authorization/asf-authorization-template'
MAIL_LIST_URL = "http://mail-archives.apache.org/mod_mbox/"

# Constant for site content location ---

SITE_CONTENT_DIR = 'content/'
CLUTCH_CONTENT_DIR = SITE_CONTENT_DIR + 'clutch/'

# Command line handling ---
# Every switch is a plain on/off flag.  The defaults are real booleans: the
# string 'False' is truthy, so a string default would silently enable a flag
# for any code that tests it by truthiness.
parser = argparse.ArgumentParser(
    description='Gather details about projects currently in incubation.')
parser.add_argument('--ignoreState', action='store_true', default=False,
                    help='Ignore state (default false)')
parser.add_argument('-v', '--verbose', action='store_true', default=False,
                    help='verbose mode (default false)')
parser.add_argument('-q', '--quiet', action='store_true', default=False,
                    help='quiet mode (default false)')
parser.add_argument('-x', '--external', action='store_true', default=False,
                    help='log external requests (e.g. svn, http) (default false)')
args = parser.parse_args()

# Normal level of info
optionInfo = not args.quiet

# Issue some extra debug information.
optionVerbose = args.verbose
if optionVerbose:
    # verbose output implies the normal informational output as well
    optionInfo = True

# Use the persistent data to speed operations.
# Occasionally bad data is cached (e.g. experimenting with developing new code).
# So need to ignore the cached data and perform all resource availability
# tests.
optionUseClutchState = not args.ignoreState

# Should we log external requests?
# Compared against the True singleton rather than tested for truthiness so
# that only a genuine boolean set by the command line flag enables logging.
optionExternal = args.external is True

# Utility functions ----


def logexternal(string):
    """Print *string* prefixed with "External: " when optionExternal is set."""
    if optionExternal:
        print("External: " + string)


def getUrl(url, encoding=None, errors=None):
    """Open *url* and return the response.

    With a truthy *encoding* the response is wrapped in an io.TextIOWrapper
    using *encoding* and *errors*; otherwise the raw response object from
    urllib.request.urlopen is returned.  Exceptions raised by urlopen are
    not caught here.
    """
    logexternal(url)
    # ensure invalid URLs don't cause long wait
    resp = urllib.request.urlopen(url, timeout=5)
    if encoding:
        return io.TextIOWrapper(resp, encoding=encoding, errors=errors)
    return resp


# NOTE: the parameter name "list" shadows the builtin; it is kept so that
# existing callers (including any keyword callers) continue to work.
def osExec(list):
    """Run the command given as an argument list and return its stdout.

    The output is whatever communicate() yields for a PIPE opened without
    text mode.
    """
    logexternal(" ".join(list))
    return subprocess.Popen(list, stdout=subprocess.PIPE).communicate()[0]


def osPopen(list):
    """Start the command given as an argument list and return the Popen object.

    stdout is a pipe opened with universal_newlines=True; the caller reads
    from it.
    """
    logexternal(" ".join(list))
    return subprocess.Popen(list, stdout=subprocess.PIPE, universal_newlines=True)


def getText(nodelist):
    """Return the concatenated data of the text nodes directly in *nodelist*.

    Non-text nodes are ignored (no recursion into child elements).
    Based on http://www.python.org/doc/2.5.2/lib/minidom-example.txt
    """
    return "".join(node.data for node in nodelist
                   if node.nodeType == node.TEXT_NODE)


def normaliseSVNurl(url):
    """Return *url* with 'https://' replaced by 'http://' and a trailing '/'.

    endswith() is used instead of indexing the last character so that an
    empty string yields '/' rather than raising IndexError.
    """
    rc = url.replace('https://', 'http://')
    if not rc.endswith('/'):
        rc = rc + '/'
    return rc


def checkStatus(k, projectList, status):
    """Report when the status file of project *k* contains no <span> element.

    k           -- key into *projectList*; also the status file base name
    projectList -- dict mapping keys to records with 'name' and 'enddate'
    status      -- word inserted into the printed message

    Prints a warning when the status file does not exist.  Any exception
    while processing the file is printed and then re-raised.
    """
    statusFile = SITE_CONTENT_DIR + "projects/{0}.xml".format(k)
    e = projectList[k]
    if not os.path.exists(statusFile):
        print("WARN: Cannot find {0}".format(statusFile))
        return
    dom = None
    try:
        dom = xml.dom.minidom.parse(statusFile)
        span = dom.getElementsByTagName("span")
        if len(span) < 1:
            print("INFO: Missing from status file: " + statusFile)
            print("\n\nThe {0} project {2} on {1}\n\n".format(
                e['name'], e['enddate'], status))
    except Exception as err:
        # a distinct name keeps the project record "e" intact; Python 3
        # unbinds the exception variable when the handler ends
        print("Exception processing " + statusFile + " : " + str(err))
        raise
    finally:
        if dom is not None:
            dom.unlink()  # release the DOM tree once it is no longer needed


projects = {}  # internal data, derived from podlings.xml
otherIssues = []
persist = {}  # persistent data to be utilised by other tools
mentorsProjects = {}  # internal data

gatherDate = datetime.datetime.utcnow()
# derived from gatherDate so that both values describe the same instant
gatherDateString = gatherDate.ctime()
delta = datetime.timedelta(days=61)
statusTallyDate1 = gatherDate - delta
delta = datetime.timedelta(days=122)
statusTallyDate2 = gatherDate - delta
delta = datetime.timedelta(days=273)
statusTallyDate3 = gatherDate - delta

# Regular expressions ---
# These expressions are used often, so compile them early.
# Raw strings keep the regex escapes (\. and \() away from Python's own
# string-escape processing; the compiled patterns are unchanged.
startDateRE = re.compile(r"([0-9]+)-0?([0-9]+)-?0?([0-9]+)?")
statusLogRE = re.compile(r"^([0-9]+)-0?([0-9]+)-0?([0-9]+)")
svnRevisionSkipRE = re.compile(
    "707389|708087|708420|708791|709356|709648|711153|744365|761864|788239|796085|804825|894972|940767|959869|1065888|1153764|1159079|1373730|1479744|1494479|1515212")
mailListRE = re.compile(r"^([-a-z0-9]+)@([a-z]+)\.apache\.org")
mailListNameRE = re.compile(r"^([a-z]+)-([-a-z0-9]+)")
mailListNameUrlRE = re.compile(r"/([a-z]+)-([-a-z0-9]+)/$")
urlHttpRE = re.compile(r"^http")
newCommitterRE = re.compile(r"[nN]ew [cC]omm?itt?ers? ?\(?([0-9]+)?")
distMirrorRE = re.compile(r"cgi/incubator/([-a-z0-9]+)/")

# Import the persistent data ---
# This enables us to skip detection of website etc. if already detected.
# NOTE(review): pickle.load can execute arbitrary code from the file it
# reads; clutch.pkl should only ever be the file written by this script.
with open('clutch.pkl', 'rb') as inputFile:
    state = pickle.load(inputFile)

# Parse the podlings data file ---
dom = xml.dom.minidom.parse(SITE_CONTENT_DIR + "podlings.xml")

graduatedProjects = {}
graduatingOrRetiring = []
retiredProjects = {}

print("Gather data from podlings.xml ...")
for row in dom.getElementsByTagName("podling"):
    name = row.getAttribute("name").strip()
    id = name.lower()
    id = id.replace(' ', '')  # strip spaces from project ID
    startDate = row.getAttribute("startdate")
    endDate = row.getAttribute("enddate")
    rowStatus = row.getAttribute("status")

    if rowStatus == 'graduated':
        resource = row.getAttribute("resource")
        graduatedProjects[resource.lower()] = {'name': name, 'enddate': endDate}
    if rowStatus == 'retired':
        resource = row.getAttribute("resource")
        retiredProjects[resource.lower()] = {'name': name, 'enddate': endDate}
    if rowStatus != 'current':
        continue

    # Only podlings currently in incubation are processed below.
    if id in projects:
        # NOTE(review): a duplicate row is reported and then skipped, so the
        # first entry is kept -- confirm this matches the intended handling.
        print("ERROR: {0}: row exists".format(id))
        continue

    needMetadata = False
    # strip spaces from project name (as per original ReportingSchedule)
    # TODO is this still needed? Or should the @name attribute not
    # contain spaces?
    podling = {
        'fullName': name,
        'name': name.replace(' ', ''),
        # Set some defaults
        'reportingMonthly': False,
        'reportingComments': "",
        'hasReportingGroup': True,
        # currently needed for reporting phase
        'reportingGroup': 'month',
        'hasStatusEntry': True,
        'statusFileName': id,
        'statusLastUpdated': "",
        'statusAge': 0,
        'statusUpdateCounts': "",
        'urlSvn': "",
        'urlTracker': "",
        'urlWww': "",
        'urlDist': "",
        'urlKeys': "",
        'hasEntryIssues': False,
        'resourceNames': [id],
    }
    projects[id] = podling

    # Some projects use an alternate short resource name
    # rather than their project name
    alias = row.getAttribute("resource")
    if alias != '' and alias != id:
        podling['resourceNames'].append(alias)
    for alias in row.getAttribute("resourceAliases").split(','):
        if alias != '':
            podling['resourceNames'].append(alias)

    podling['entryDate'] = None
    podling['committersSvn'] = None
    podling['hintMailListDev'] = ""
    podling['hasMailListDev'] = ""
    podling['hintMailListCommits'] = ""
    podling['hasMailListCommits'] = ""
    podling['numberCommitters'] = 0
    podling['numberCommittersNew'] = 0
    podling['hasClutchState'] = id in state

    descElements = row.getElementsByTagName("description")
    podling['description'] = getText(descElements[0].childNodes)
    if 'FIXME' in podling['description']:
        needMetadata = True
    podling['sponsor'] = row.getAttribute("sponsor")
    podling['startDate'] = startDate
    # replaces the default set above with the "resource" attribute
    podling['statusFileName'] = row.getAttribute("resource")

    mentors = [mentor.firstChild.data.strip()
               for mentor in row.getElementsByTagName("mentor")]
    podling['mentors'] = mentors
    if 'FIXME' in mentors:
        needMetadata = True

    if needMetadata:
        errorMsg = "{0}: Need to add incubation metadata.".format(id)
        print('ERROR:', errorMsg)
        errorMsg += " Please maintain your records in the content/podlings.xml file. See help."
        otherIssues.append(errorMsg)

    # determine projects for each mentor
    for mentor in mentors:
        mentorsProjects.setdefault(mentor, []).append(name)

    # The end date is taken from the "enddate" attribute read above;
    # attribute names are case-sensitive, so looking up "endDate" here
    # would always yield an empty string.
    isGraduating = row.getElementsByTagName("graduating").length > 0
    if isGraduating:
        graduatingOrRetiring.append(id)
        if not endDate:
            errorMsg = "{0}: Has graduated, but still needs to follow the graduation steps.".format(
                id)
            print('ERROR:', errorMsg)
            errorMsg += " See help."
            otherIssues.append(errorMsg)

    isRetiring = row.getElementsByTagName("retiring").length > 0
    if isRetiring:
        graduatingOrRetiring.append(id)
        if not endDate:
            errorMsg = "{0}: Has retired, but still needs to follow the retirement steps.".format(
                id)
            print('ERROR:', errorMsg)
            errorMsg += " See help."
            otherIssues.append(errorMsg)

    # Is it reporting monthly?
    reporting = row.getElementsByTagName("reporting")
    if reporting.length != 1:
        podling['hasReportingGroup'] = False
        if not isGraduating:
            print(
                "ERROR: {0}: expecting a single reportgroup".format(name))
    else:
        reportingElement = reporting[0]
        if reportingElement.getAttribute("monthly").lower() == 'true':
            podling['reportingMonthly'] = True
            # getText() needs the element's child nodes; handing it the
            # element list itself never finds a text node
            podling['reportingComments'] = getText(reportingElement.childNodes)
            podling['hasEntryIssues'] = True
        group = reportingElement.getAttribute("group")
        # minidom returns "" (never None) for a missing attribute
        if not group:
            print("ERROR: {0}: missing group attribute".format(name))
            podling['hasReportingGroup'] = False
        else:
            podling['reportingGroup'] = 'group-' + group

dom.unlink()

for k in sorted(graduatedProjects):
    checkStatus(k, graduatedProjects, 'graduated')

for k in sorted(retiredProjects):
    checkStatus(k, retiredProjects, 'retired')

# Process the incubation table data, detect some potential issues.
--- print("Gather details from project status files ...") projectNames = list(projects.keys()) for k in sorted(projectNames, key=str.lower): if optionVerbose: print("DEBUG: Processing status file for {0}".format(k)) # Append more potential alternate names for a project if projects[k]['statusFileName'] not in projects[k]['resourceNames']: projects[k]['resourceNames'].append(projects[k]['statusFileName']) if optionVerbose and len(projects[k]['resourceNames']) > 1: print("DEBUG: Will try alternate names: {0}".format( projects[k]['resourceNames'])) # parse their project status file to extract specific information statusFile = SITE_CONTENT_DIR + \ "projects/{0}.xml".format(projects[k]['statusFileName']) if os.path.exists(statusFile): try: dom = xml.dom.minidom.parse(statusFile) except (Exception) as e: print("Exception processing " + statusFile + " : " + str(e)) raise # get the project info hints if optionVerbose: print("DEBUG: Gather hints from project Status page") table = dom.getElementsByTagName("table")[0] for row in table.getElementsByTagName("tr")[1:]: if (len(row.getElementsByTagName("td")) < 3): continue cell = row.getElementsByTagName("td")[2] if 'id' in cell.attributes: values = [getText(item.childNodes) for item in cell.childNodes] value = " ".join(values).strip() if value == "": value = getText(cell.childNodes).strip() if optionVerbose: print("DEBUG: Hint: {0}={1}".format( cell.getAttribute('id'), value)) if cell.getAttribute('id') == "mail-dev": value = value.replace(' at ', '@') value = value.replace(' Subscribe Unsubscribe', '') value = value.replace(' Archive', '') value = value.replace(' ', '@', 1) value = value.replace(' ', '') value = value.replace('@@', '@') matchMail = re.search(mailListRE, value) if matchMail: projects[k][ 'hintMailListDev'] = "{0}-{1}".format(matchMail.group(2), matchMail.group(1)) continue if cell.getAttribute('id') == "mail-commits": value = value.replace(' at ', '@') value = value.replace(' Subscribe Unsubscribe', '') value = 
value.replace(' Archive', '') value = value.replace(' ', '@', 1) value = value.replace(' ', '') value = value.replace('@@', '@') matchMail = re.search(mailListRE, value) if matchMail: projects[k][ 'hintMailListCommits'] = "{0}-{1}".format(matchMail.group(2), matchMail.group(1)) continue # Get hints for various url-based resources matchUrl = re.search(urlHttpRE, value) if not matchUrl: for item in cell.getElementsByTagName('a'): if 'href' in item.attributes: value = item.getAttribute('href') break hasUrl = re.search(urlHttpRE, value) if cell.getAttribute('id') == "svn" and hasUrl: projects[k]['urlSvn'] = value continue if cell.getAttribute('id') == "tracker" and hasUrl: projects[k]['urlTracker'] = value continue if cell.getAttribute('id') == "www" and hasUrl: projects[k]['urlWww'] = value continue # Scan the project News section and count new commiters. for section in dom.getElementsByTagName("section"): if 'id' in section.attributes and section.getAttribute('id') == "News": for line in section.toxml().splitlines(): if ('\n") if len(otherIssues): otherXml = """

other issues listed below for: """ otherIssuesRE = re.compile("^([^:]+):.*$") otherIssues.sort() for issue in otherIssues: matchOtherIssues = re.search(otherIssuesRE, issue) otherXml += '\n {0} '.format( matchOtherIssues.group(1)) otherXml += "\n

\n" fileXmlo1.write(otherXml) fileXmlo1.close() fileXmlt = open(CLUTCH_CONTENT_DIR + 'clutcht.ent', encoding='utf-8', mode='w') fileXmlt.write("\n") tableTopXml = """ Clutch last gathered: {0} UTC.
Number of podlings in incubation: {1} """.format(gatherDateString, len(projects)) fileXmlt.write(tableTopXml) fileXmlt.close() fileList.write('#identifier,name,sponsor\n') reportList1 = "" reportList2 = "" reportList3 = "" tableRowCount = 0 tableRowCountMid = int(len(projects) / 2) fileXml = open(CLUTCH_CONTENT_DIR + 'clutchr1.ent', encoding='utf-8', mode='w') fileXml.write("\n") for k in sorted(projectNames, key=str.lower): tableRowCount += 1 if tableRowCount == tableRowCountMid: fileXml.close() fileXml = open(CLUTCH_CONTENT_DIR + 'clutchr2.ent', encoding='utf-8', mode='w') fileXml.write("\n") fileXml.write(' \n'.format(k)) fileXml.write(' {0}\n'.format(projects[k]['fullName'])) persist[k] = {} persist[k]['podlingName'] = projects[k]['name'] persist[k]['fullName'] = projects[k]['fullName'] if '?' in projects[k]['sponsor']: fileXml.write( ' {0}\n'.format(projects[k]['sponsor'])) else: fileXml.write( ' {0}\n'.format(projects[k]['sponsor'])) persist[k]['sponsor'] = projects[k]['sponsor'] persist[k]['description'] = projects[k]['description'] persist[k]['mentors'] = projects[k]['mentors'] fileXml.write(' {0}\n'.format(projects[k]['startDate'])) persist[k]['startDate'] = projects[k]['startDate'] # elapsedDays column fileXml.write(' \n') if not projects[k]['reportingMonthly']: fileXml.write( ' {0}\n'.format(projects[k]['reportingMonthly'])) else: fileXml.write( ' {0}\n'.format(projects[k]['reportingMonthly'])) persist[k]['reportingMonthly'] = projects[k]['reportingMonthly'] fileXml.write( ' {0}\n'.format(projects[k]['reportingGroup'])) # save the simple group number for programs that have their own ideas. 
persist[k]['rawReportingGroup'] = projects[k]['reportingGroup'] persist[k]['reportingGroup'] = reportingGroups[ projects[k]['reportingGroup']] reportDevList = '"{0} Developers"'.format(projects[k]['fullName']) if projects[k]['hasMailListDev']: matchDevMail = re.search(mailListNameUrlRE, projects[ k]['hasMailListDev']) if matchDevMail: mailListGroup = None for alias in projects[k]['resourceNames']: if (alias in mailLists.newStyle): mailListGroup = alias if (mailListGroup != None): reportDevList += " ".format( mailListGroup) else: reportDevList += " <{0}@{1}.apache.org>".format( matchDevMail.group(2), matchDevMail.group(1)) else: reportDevList += " " else: reportDevList += " " if optionVerbose: print("DEBUG: {0}: reportDevList={1}".format(k, reportDevList)) reportDevList += "\n" if projects[k]['reportingMonthly']: reportList1 += reportDevList reportList2 += reportDevList reportList3 += reportDevList else: if (projects[k]['reportingGroup'] == "group-1"): reportList1 += reportDevList elif (projects[k]['reportingGroup'] == "group-2"): reportList2 += reportDevList elif (projects[k]['reportingGroup'] == "group-3"): reportList3 += reportDevList if projects[k]['hasReportingGroup']: fileXml.write( ' {0}\n'.format(projects[k]['hasReportingGroup'])) else: fileXml.write( ' {0}\n'.format(projects[k]['hasReportingGroup'])) if projects[k]['hasStatusEntry']: fileXml.write(' {1}\n'.format( projects[k]['statusFileName'], projects[k]['hasStatusEntry'])) else: fileXml.write( ' {0}\n'.format(projects[k]['hasStatusEntry'])) fileXml.write( ' {0}\n'.format(projects[k]['statusLastUpdated'])) # statusAge column fileXml.write(' \n') fileXml.write( ' {0}\n'.format(projects[k]['statusUpdateCounts'])) if projects[k]['numberCommitters'] > 0: if projects[k]['numberCommitters'] > 2: fileXml.write(' {1}\n'.format( projects[k]['committersSvn'], projects[k]['numberCommitters'])) else: fileXml.write(' {1}\n'.format( projects[k]['committersSvn'], projects[k]['numberCommitters'])) else: fileXml.write(' 
-\n') if projects[k]['numberCommittersNew'] > 0: if projects[k]['numberCommittersNew'] > 1: fileXml.write( ' {0}\n'.format(projects[k]['numberCommittersNew'])) else: fileXml.write( ' {0}\n'.format(projects[k]['numberCommittersNew'])) else: fileXml.write(' 0\n') if projects[k]['urlSvn']: fileXml.write( ' True\n'.format(projects[k]['urlSvn'])) else: fileXml.write(' False\n') persist[k]['urlSvn'] = projects[k]['urlSvn'] if projects[k]['urlTracker']: fileXml.write( ' True\n'.format(projects[k]['urlTracker'])) else: fileXml.write(' False\n') persist[k]['urlTracker'] = projects[k]['urlTracker'] hasUrl = re.search(urlHttpRE, projects[k]['hasMailListDev']) if hasUrl: fileXml.write( ' True\n'.format(projects[k]['hasMailListDev'])) else: fileXml.write(' False\n') persist[k]['hasMailListDev'] = projects[k]['hasMailListDev'] hasUrl = re.search(urlHttpRE, projects[k]['hasMailListCommits']) if hasUrl: fileXml.write(' True\n'.format( projects[k]['hasMailListCommits'])) else: fileXml.write(' False\n') persist[k]['hasMailListCommits'] = projects[k]['hasMailListCommits'] if projects[k]['urlWww']: fileXml.write( ' True\n'.format(projects[k]['urlWww'])) else: fileXml.write(' False\n') persist[k]['urlWww'] = projects[k]['urlWww'] if projects[k]['urlDist']: fileXml.write( ' True\n'.format(projects[k]['urlDist'])) else: fileXml.write(' False\n') persist[k]['urlDist'] = projects[k]['urlDist'] if projects[k]['urlKeys']: fileXml.write( ' True\n'.format(projects[k]['urlKeys'])) else: fileXml.write(' False\n') match = re.search(distMirrorRE, projects[k]['urlDist']) if match: if match.group(1) in releases: fileXml.write( ' True\n'.format(projects[k]['urlDist'])) else: fileXml.write(' False\n') else: fileXml.write(' False\n') fileXml.write(' \n') fileList.write('{0},"{1}","{2}"\n'.format( k, projects[k]['name'], projects[k]['sponsor'])) fileXml.close() # End of rows # Other issues fileXmlo2 = open(CLUTCH_CONTENT_DIR + 'clutcho2.ent', encoding='utf-8', mode='w') fileXmlo2.write("\n") if 
len(otherIssues): otherIssues.sort() for issue in otherIssues: fileXmlo2.write("

{0}

\n".format(issue)) else: fileXmlo2.write("

No known issues.

\n") fileXmlo2.close() mentors = list(mentorsProjects.keys()) mentors.sort() fileXmlm = open(CLUTCH_CONTENT_DIR + 'clutchm.ent', encoding='utf-8', mode='w') fileXmlm.write("\n") for mentor in mentors: fileXmlm.write("

{0}: {1}

\n".format( mentor, ', '.join(mentorsProjects[mentor]))) fileXmlm.close() fileList.close() fileReport1 = open(CLUTCH_CONTENT_DIR + 'report_due_1.txt', 'w') fileReport1.write(reportList1) fileReport1.close() fileReport2 = open(CLUTCH_CONTENT_DIR + 'report_due_2.txt', 'w') fileReport2.write(reportList2) fileReport2.close() fileReport3 = open(CLUTCH_CONTENT_DIR + 'report_due_3.txt', 'w') fileReport3.write(reportList3) fileReport3.close() # Create the persistent data file. outputFile = open('clutch.pkl', 'wb') pickle.dump(persist, outputFile, protocol=3) outputFile.close() print("Done. Generated clutch*.ent files.") print("Now you need to re-build the site, as usual.")