Author: hboutemy Date: Sat May 9 16:51:29 2015 New Revision: 1678501 URL: http://svn.apache.org/r1678501 Log: renamed committers.json to groups.json and projects field to groups to better match data source, ie LDAP groups Added: comdev/projects.apache.org/site/json/foundation/groups.json - copied unchanged from r1678500, comdev/projects.apache.org/site/json/foundation/committers.json Removed: comdev/projects.apache.org/site/json/foundation/committers.json Modified: comdev/projects.apache.org/scripts/README.txt comdev/projects.apache.org/scripts/cronjobs/parsecommitters.py comdev/projects.apache.org/site/js/projects.js comdev/projects.apache.org/site/json/foundation/.htaccess comdev/projects.apache.org/site/json/foundation/HEADER.html comdev/projects.apache.org/site/json/foundation/people.json Modified: comdev/projects.apache.org/scripts/README.txt URL: http://svn.apache.org/viewvc/comdev/projects.apache.org/scripts/README.txt?rev=1678501&r1=1678500&r2=1678501&view=diff ============================================================================== --- comdev/projects.apache.org/scripts/README.txt (original) +++ comdev/projects.apache.org/scripts/README.txt Sat May 9 16:51:29 2015 @@ -14,8 +14,8 @@ various sources: - parsecommitters.py: Fetches and parses the committer (LDAP) list via people.apache.org. in: http://people.apache.org/committer-index.html - out: foundation/people.json + foundation/committers.json - List of committers with reference to projects (people.json) and pmcs with corresponding committers (committers.json) + out: foundation/people.json + foundation/groups.json + List of committers with reference to groups (people.json) and groups with corresponding committers (groups.json) - podlings.py: Reads podlings.xml from the incubator site and creates a JSON with timeline data, as well as current podling projects information. 
@@ -50,4 +50,4 @@ various sources: list of PMCs with site url (pmcs.json) and monthly list of new committees (committees.json) -Notice: cycles.json is not imported from anywhere +Notice: cycles.json is not imported from anywhere (could/should be from committee-info.txt) Modified: comdev/projects.apache.org/scripts/cronjobs/parsecommitters.py URL: http://svn.apache.org/viewvc/comdev/projects.apache.org/scripts/cronjobs/parsecommitters.py?rev=1678501&r1=1678500&r2=1678501&view=diff ============================================================================== --- comdev/projects.apache.org/scripts/cronjobs/parsecommitters.py (original) +++ comdev/projects.apache.org/scripts/cronjobs/parsecommitters.py Sat May 9 16:51:29 2015 @@ -1,12 +1,9 @@ -from xml.dom import minidom -import xml.etree.ElementTree as ET -import re, urllib.request -import csv +import re +import urllib.request import json -import os people = {} -pmcs = {} +groups = {} data = urllib.request.urlopen("http://people.apache.org/committer-index.html").read().decode('utf-8') x = 0 for committer in re.findall(r"([\S\s]+?)", data, re.MULTILINE | re.UNICODE): @@ -16,19 +13,19 @@ for committer in re.findall(r"([\S\s if m: cid = m.group(1) cname = re.sub(r"<.+?>", "", m.group(2), 4) - cproj = m.group(3) - projects = [] + groupsString = m.group(3) + cgroups = [] isMember = False if re.search(r"cronjobs/countaccounts.py" accounts.json AddDescription "generated by cronjobs/parsechairs.py" chairs.json AddDescription "imported with import/parsecommittees.py" committees.json -AddDescription "generated by cronjobs/parsecommitters.py" committers.json AddDescription "manually maintained" cycles.json AddDescription "generated by cronjobs/podlings.py" evolution.json +AddDescription "generated by cronjobs/parsecommitters.py" groups.json AddDescription "generated by cronjobs/parsecommitters.py" people.json AddDescription "imported with import/parsepmcs.py from PMC DOAP files" pmcs.json AddDescription "generated by 
cronjobs/podlings.py" podlings.json Modified: comdev/projects.apache.org/site/json/foundation/HEADER.html URL: http://svn.apache.org/viewvc/comdev/projects.apache.org/site/json/foundation/HEADER.html?rev=1678501&r1=1678500&r2=1678501&view=diff ============================================================================== --- comdev/projects.apache.org/site/json/foundation/HEADER.html (original) +++ comdev/projects.apache.org/site/json/foundation/HEADER.html Sat May 9 16:51:29 2015 @@ -6,9 +6,9 @@ for more information.
  • accounts.json generated by cronjobs/countaccounts.py from LDAP
  • chairs.json generated by cronjobs/parsechairs.py from http://www.apache.org/foundation/
  • committees.json imported with import/parsecommittees.py from https://svn.apache.org/repos/private/committers/board/committee-info.txt
- • committers.json and people.json generated by cronjobs/parsecommitters.py from http://people.apache.org/committer-index.html
  • cycles.json manually maintained
  • evolution.json and podlings.json generated by cronjobs/podlings.py from http://incubator.apache.org/podlings.xml
+ • groups.json and people.json generated by cronjobs/parsecommitters.py from http://people.apache.org/committer-index.html
  • pmcs.json imported with import/parsepmcs.py from PMC DOAP files
  • projects.json imported with import/rdfparse.py from projects' DOAP files
  • releases.json generated by cronjobs/parsereleases.py from http://www.apache.org/dist/