api/pages/code/pony.py (181 lines of code) (raw):

#!/usr/bin/env python3 # -*- coding: utf-8 -*- # Licensed to the Apache Software Foundation (ASF) under one or more # contributor license agreements. See the NOTICE file distributed with # this work for additional information regarding copyright ownership. # The ASF licenses this file to You under the Apache License, Version 2.0 # (the "License"); you may not use this file except in compliance with # the License. You may obtain a copy of the License at # # http://www.apache.org/licenses/LICENSE-2.0 # # Unless required by applicable law or agreed to in writing, software # distributed under the License is distributed on an "AS IS" BASIS, # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. # See the License for the specific language governing permissions and # limitations under the License. ######################################################################## # OPENAPI-URI: /api/code/pony ######################################################################## # get: # responses: # '200': # content: # application/json: # schema: # $ref: '#/components/schemas/Factor' # description: 200 Response # default: # content: # application/json: # schema: # $ref: '#/components/schemas/Error' # description: unexpected error # security: # - cookieAuth: [] # summary: Shows pony factor data for a set of repos over a given period of time # post: # requestBody: # content: # application/json: # schema: # $ref: '#/components/schemas/defaultWidgetArgs' # responses: # '200': # content: # application/json: # schema: # $ref: '#/components/schemas/Factor' # description: 200 Response # default: # content: # application/json: # schema: # $ref: '#/components/schemas/Error' # description: unexpected error # security: # - cookieAuth: [] # summary: Shows pony factor data for a set of repos over a given period of time # ######################################################################## """ This is the pony factor renderer for Kibble """ import json import time import 
import re


def _period_query(session, indata, view_list, date_from, date_to):
    """Build the commit query for one organisation and one time period.

    The query always restricts on the ``tsday`` range and on the user's
    default organisation (falling back to "apache" when that is unset).
    An explicit ``source`` in *indata* takes precedence over *view_list*
    for the optional ``sourceID`` restriction.
    """
    organisation = session.user['defaultOrganisation'] or "apache"
    must = [
        {'range': {'tsday': {'from': date_from, 'to': date_to}}},
        {'term': {'organisation': organisation}},
    ]
    if indata.get('source'):
        must.append({'term': {'sourceID': indata.get('source')}})
    elif view_list:
        must.append({'terms': {'sourceID': view_list}})
    return {'query': {'bool': {'must': must}}}


def _majority_keys(buckets, total):
    """Return the leading bucket keys whose summed doc counts exceed half of *total*.

    Buckets are consumed in the order given; accumulation stops at the
    first bucket that pushes the running sum past ``total // 2``. If the
    threshold is never passed, every bucket key is returned.
    """
    threshold = total // 2
    keys = []
    running = 0
    for bucket in buckets:
        keys.append(bucket['key'])
        running += bucket['doc_count']
        if running > threshold:
            break
    return keys


def _period_factors(session, query):
    """Compute (committer PF, author PF, author-domain count) for *query*.

    Issues one count request and one aggregation-only search against the
    ``code_commit`` doc type. *query* is mutated: an ``aggs`` section is
    added before the search.
    """
    es = session.DB.ES
    index = session.DB.dbname

    # Total number of matching commits; half of this is the PF threshold.
    total = es.count(index=index, doc_type="code_commit", body=query)['count']

    # Ask for up to 5000 distinct committer and author e-mail buckets.
    query['aggs'] = {
        'by_committer': {
            'terms': {'field': 'committer_email', 'size': 5000}
        },
        'by_author': {
            'terms': {'field': 'author_email', 'size': 5000}
        },
    }
    res = es.search(index=index, doc_type="code_commit", size=0, body=query)
    aggregations = res['aggregations']

    committers = _majority_keys(aggregations['by_committer']['buckets'], total)
    authors = _majority_keys(aggregations['by_author']['buckets'], total)

    # Meta-pony factor: distinct e-mail domains among the majority authors.
    # Keys without an '@' carry no domain and are skipped instead of
    # raising IndexError and failing the whole request.
    domains = set()
    for email in authors:
        parts = email.lower().split('@')
        if len(parts) > 1:
            domains.add(parts[1])

    return len(committers), len(authors), len(domains)


def run(API, environ, indata, session):
    """Render pony factor data for the requested period and the one before it.

    The current period is ``[from, to]`` taken from *indata*; ``to``
    defaults to the current time and ``from`` to 24 thirty-day months
    before ``to``. The previous period has the same length and ends just
    before ``from``.

    Args:
        API: object providing ``exception(code, message)`` for error responses.
        environ: request environment (not used here).
        indata: request arguments; ``view``, ``subfilter``, ``source``,
            ``from`` and ``to`` are read.
        session: current session; ``user``, ``getView``, ``subFilter`` and
            ``DB`` are used.

    Yields:
        A single JSON string with ``factors`` (committer, author and
        meta pony factors, each with ``count`` and ``previous``),
        ``okay`` and ``responseTime``.

    Raises:
        API.exception: with code 403 when no user is logged in.
    """
    # We need to be logged in for this!
    if not session.user:
        raise API.exception(403, "You must be logged in to use this API endpoint!")

    now = time.time()

    # First, fetch the view if we have such a thing enabled
    viewList = []
    if indata.get('view'):
        viewList = session.getView(indata.get('view'))
    if indata.get('subfilter'):
        viewList = session.subFilter(indata.get('subfilter'), view=viewList)

    dateTo = indata.get('to', int(time.time()))
    dateFrom = indata.get('from', dateTo - (86400 * 30 * 24))  # Default to a 24 month span
    if dateFrom < 0:
        dateFrom = 0
    # Start of the comparison period: same span, immediately preceding dateFrom.
    dateYonder = dateFrom - (dateTo - dateFrom)

    # Current period
    pf_committer, pf_author, meta_pf = _period_factors(
        session, _period_query(session, indata, viewList, dateFrom, dateTo)
    )

    # Previous period
    pf_committer_b, pf_author_b, meta_pf_b = _period_factors(
        session, _period_query(session, indata, viewList, dateYonder, dateFrom - 1)
    )

    JSON_OUT = {
        'factors': [
            {
                'title': "Pony Factor (by committership)",
                'count': pf_committer,
                'previous': pf_committer_b,
            },
            {
                'title': "Pony Factor (by authorship)",
                'count': pf_author,
                'previous': pf_author_b,
            },
            {
                'title': "Meta-Pony Factor (by authorship)",
                'count': meta_pf,
                'previous': meta_pf_b,
            },
        ],
        'okay': True,
        'responseTime': time.time() - now,
    }
    yield json.dumps(JSON_OUT)