api/pages/mail/top-authors.py (89 lines of code) (raw):
#!/usr/bin/env python3
# -*- coding: utf-8 -*-
# Licensed to the Apache Software Foundation (ASF) under one or more
# contributor license agreements. See the NOTICE file distributed with
# this work for additional information regarding copyright ownership.
# The ASF licenses this file to You under the Apache License, Version 2.0
# (the "License"); you may not use this file except in compliance with
# the License. You may obtain a copy of the License at
#
# http://www.apache.org/licenses/LICENSE-2.0
#
# Unless required by applicable law or agreed to in writing, software
# distributed under the License is distributed on an "AS IS" BASIS,
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
# See the License for the specific language governing permissions and
# limitations under the License.
########################################################################
# OPENAPI-URI: /api/mail/top-authors
########################################################################
# get:
# responses:
# '200':
# content:
# application/json:
# schema:
# $ref: '#/components/schemas/CommitterList'
# description: 200 Response
# default:
# content:
# application/json:
# schema:
# $ref: '#/components/schemas/Error'
# description: unexpected error
# security:
# - cookieAuth: []
# summary: Shows the top N of email authors
# post:
# requestBody:
# content:
# application/json:
# schema:
# $ref: '#/components/schemas/defaultWidgetArgs'
# responses:
# '200':
# content:
# application/json:
# schema:
# $ref: '#/components/schemas/CommitterList'
# description: 200 Response
# default:
# content:
# application/json:
# schema:
# $ref: '#/components/schemas/Error'
# description: unexpected error
# security:
# - cookieAuth: []
# summary: Shows the top N of email authors
#
########################################################################
"""
This is the TopN email authors list renderer for Kibble
"""
import json
import time
import hashlib
import re
# Pattern for sender addresses that belong to automation rather than people.
# run() applies it with re.match, so it only hits addresses that start with
# one of these local parts followed by "@"; matching senders are skipped.
ROBITS = r"(git|jira|jenkins|gerrit)@"
def run(API, environ, indata, session):
    """
    Render the list of top email authors for the requested period.

    This is a generator: it yields one JSON-encoded string holding the
    result document.

    Parameters:
        API: object whose ``exception(code, message)`` builds the error
            raised when the caller is not logged in.
        environ: not used by this endpoint.
        indata: request arguments, read through ``.get()``. Keys consulted:
            ``view``, ``subfilter``, ``to``, ``from`` and ``source``.
        session: current session. ``session.user`` must be truthy and
            provide ``defaultOrganisation``; ``session.getView`` and
            ``session.subFilter`` resolve the source list;
            ``session.DB.ES`` / ``session.DB.dbname`` are used for the
            search and the per-author person lookups.

    Yields:
        A JSON string with ``topN`` (``denoter`` plus ``items`` sorted by
        descending email count), ``sorted`` (the same person records keyed
        by sender address), ``okay`` and ``responseTime``.

    Raises:
        Whatever ``API.exception(403, ...)`` constructs, when
        ``session.user`` is falsy.
    """
    # We need to be logged in for this!
    if not session.user:
        raise API.exception(403, "You must be logged in to use this API endpoint!")

    now = time.time()

    # First, fetch the view if we have such a thing enabled
    viewList = []
    if indata.get('view'):
        viewList = session.getView(indata.get('view'))
    if indata.get('subfilter'):
        viewList = session.subFilter(indata.get('subfilter'), view=viewList)

    dateTo = indata.get('to', int(time.time()))
    # Default to a 6 month span (180 days, expressed in seconds)
    dateFrom = indata.get('from', dateTo - (86400 * 30 * 6))

    # Fall back to "apache" when the user has no default organisation set
    dOrg = session.user['defaultOrganisation'] or "apache"
    must = [
        {
            'range': {
                'ts': {
                    'from': dateFrom,
                    'to': dateTo,
                }
            }
        },
        {
            'term': {
                'organisation': dOrg
            }
        },
    ]

    # Source-specific or view-specific?? An explicit source wins over a view.
    if indata.get('source'):
        must.append({'term': {'sourceID': indata.get('source')}})
    elif viewList:
        must.append({'terms': {'sourceID': viewList}})

    query = {
        'query': {
            'bool': {
                'must': must
            }
        },
        # Ask for the 30 most frequent senders in this period; the bot
        # filter and person lookup below may shorten the final list.
        'aggs': {
            'authors': {
                'terms': {
                    'field': 'sender',
                    'size': 30
                }
            }
        },
    }

    # size=0: only the aggregation buckets are needed, not the hits
    res = session.DB.ES.search(
        index=session.DB.dbname,
        doc_type="email",
        size=0,
        body=query
    )

    people = {}
    for bucket in res['aggregations']['authors']['buckets']:
        email = bucket['key']
        # By default, we want to see humans, not bots on this list!
        if re.match(ROBITS, email):
            continue

        # The person document is looked up by sha1(organisation + sender)
        sha = hashlib.sha1(("%s%s" % (dOrg, email)).encode('utf-8')).hexdigest()
        # Senders without a person document are left out of the result
        if not session.DB.ES.exists(index=session.DB.dbname, doc_type="person", id=sha):
            continue

        pres = session.DB.ES.get(
            index=session.DB.dbname,
            doc_type="person",
            id=sha
        )
        person = pres['_source']
        person['name'] = person.get('name', 'unknown')
        # Hex MD5 of the stored address, exposed under the 'gravatar' key
        person['gravatar'] = hashlib.md5(person.get('email', 'unknown').encode('utf-8')).hexdigest()
        person['count'] = bucket['doc_count']
        people[email] = person

    # Busiest authors first; sorted() is stable, so ties keep bucket order
    topN = sorted(people.values(), key=lambda x: x['count'], reverse=True)

    JSON_OUT = {
        'topN': {
            'denoter': 'emails',
            'items': topN
        },
        'sorted': people,
        'okay': True,
        'responseTime': time.time() - now
    }
    yield json.dumps(JSON_OUT)