chromium-dashboard/api/metricsdata.py

246 строки
7.7 KiB
Python
Executable File

# -*- coding: utf-8 -*-
# Copyright 2013 Google Inc.
#
# Licensed under the Apache License, Version 2.0 (the "License")
# you may not use this file except in compliance with the License.
# You may obtain a copy of the License at
#
# http://www.apache.org/licenses/LICENSE-2.0
#
# Unless required by applicable law or agreed to in writing, software
# distributed under the License is distributed on an "AS IS" BASIS,
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
# See the License for the specific language governing permissions and
# limitations under the License.
__author__ = 'ericbidelman@chromium.org (Eric Bidelman)'
import datetime
import json
import logging
from framework import users
from framework import basehandlers
from internals import models
from framework import ramcache
import settings
# Lifetime, in seconds, passed as `time=` to ramcache.set() by the handlers
# in this module when they cache query results.
CACHE_AGE = 86400 # 24hrs
def _truncate_day_percentage(datapoint):
    """Round ``datapoint.day_percentage`` to 8 decimal places, in place.

    Eight decimals are kept because the number is later multiplied by 100
    to get a percentage, and six decimals are wanted there.

    Args:
      datapoint: object with a numeric ``day_percentage`` attribute.

    Returns:
      The same ``datapoint`` object, after its attribute has been updated.
    """
    rounded_text = '%.8f' % (datapoint.day_percentage,)
    datapoint.day_percentage = float(rounded_text)
    return datapoint
def _is_googler(user):
    """Tell whether ``user`` has an email address ending in '@google.com'.

    Args:
      user: object with an ``email()`` method, or a falsy value (e.g. None)
        when there is no user.

    Returns:
      The falsy ``user`` value itself when there is no user; otherwise
      True/False depending on the email suffix.
    """
    if not user:
        return user
    return user.email().endswith('@google.com')
def _clean_data(data):
    """Return ``data``, with day percentages truncated for non-googlers.

    Args:
      data: iterable of datapoints with a ``day_percentage`` attribute.

    Returns:
      ``data`` itself when the current user is a googler; otherwise a new
      list of the same datapoints, each passed through
      ``_truncate_day_percentage``.
    """
    viewer = users.get_current_user()
    if _is_googler(viewer):
        return data
    # Don't show raw percentages if user is not a googler.
    return [_truncate_day_percentage(point) for point in data]
def _filter_metric_data(data, formatted=False):
    """Filter out unneeded metric data before sending.

    Args:
      data: iterable of datapoints. Unless ``formatted`` is true, each item
        is converted by calling its ``to_dict()`` method.
      formatted: when true, the items are used as they are (after cleaning)
        and must already support ``pop(key, default)``.

    Returns:
      The cleaned items with the 'rolling_percentage', 'updated' and
      'created' keys removed.
    """
    cleaned = _clean_data(data)
    rows = cleaned if formatted else [entity.to_dict() for entity in cleaned]

    # Remove keys that the frontend doesn't render.
    for row in rows:
        for hidden_key in ('rolling_percentage', 'updated', 'created'):
            row.pop(hidden_key, None)

    return rows
class TimelineHandler(basehandlers.FlaskHandler):
    """Base handler returning every datapoint of one bucket, ordered by date.

    Subclasses are expected to define ``CACHE_KEY`` (prefix of the ramcache
    key) and ``MODEL_CLASS`` (the model that is queried).
    """

    HTTP_CACHE_TYPE = 'private'
    JSONIFY = True

    def make_query(self, bucket_id):
        """Build the MODEL_CLASS query for the datapoints of ``bucket_id``.

        Args:
          bucket_id: integer bucket id to filter on.

        Returns:
          An unordered query filtered by bucket id (and, for
          models.AnimatedProperty, by date).
        """
        query = self.MODEL_CLASS.query()
        query = query.filter(self.MODEL_CLASS.bucket_id == bucket_id)

        # The switch to new UMA data changed the semantics of the CSS animated
        # properties. Since showing the historical data alongside the new data
        # does not make sense, filter out everything before the 2017-10-26
        # switch.
        # See https://github.com/GoogleChrome/chromium-dashboard/issues/414
        if self.MODEL_CLASS == models.AnimatedProperty:
            query = query.filter(
                self.MODEL_CLASS.date >= datetime.datetime(2017, 10, 26))

        return query

    def get_template_data(self):
        """Return the filtered timeline for the 'bucket_id' request argument.

        Returns:
          An empty list when 'bucket_id' is missing or is not an integer;
          otherwise the datapoints (from ramcache when available, else from
          the datastore) after ``_filter_metric_data``.
        """
        try:
            bucket_id = int(self.request.args.get('bucket_id'))
        except (TypeError, ValueError):
            # TypeError: the argument is absent (int(None)).
            # ValueError: the argument is not a valid integer string.
            # Anything else is unexpected and is allowed to propagate.
            # TODO(jrobbins): Why return [] instead of 400?
            return []

        cache_key = '%s|%s' % (self.CACHE_KEY, bucket_id)

        datapoints = ramcache.get(cache_key)

        # Note: an empty cached result is falsy, so it is queried again.
        if not datapoints:
            query = self.make_query(bucket_id)
            query = query.order(self.MODEL_CLASS.date)
            datapoints = query.fetch(None)  # All matching results.

            # Remove outliers if percentage is not between 0-1.
            #datapoints = filter(lambda x: 0 <= x.day_percentage <= 1, datapoints)

            ramcache.set(cache_key, datapoints, time=CACHE_AGE)

        return _filter_metric_data(datapoints)
class PopularityTimelineHandler(TimelineHandler):
    """Timeline handler that reads models.StableInstance datapoints."""

    MODEL_CLASS = models.StableInstance
    CACHE_KEY = 'css_pop_timeline'

    def get_template_data(self):
        """Delegate, unchanged, to the parent class implementation."""
        parent = super(PopularityTimelineHandler, self)
        return parent.get_template_data()
class AnimatedTimelineHandler(TimelineHandler):
    """Timeline handler that reads models.AnimatedProperty datapoints."""

    MODEL_CLASS = models.AnimatedProperty
    CACHE_KEY = 'css_animated_timeline'

    def get_template_data(self):
        """Delegate, unchanged, to the parent class implementation."""
        parent = super(AnimatedTimelineHandler, self)
        return parent.get_template_data()
class FeatureObserverTimelineHandler(TimelineHandler):
    """Timeline handler that reads models.FeatureObserver datapoints."""

    MODEL_CLASS = models.FeatureObserver
    CACHE_KEY = 'featureob_timeline'

    def get_template_data(self):
        """Delegate, unchanged, to the parent class implementation."""
        parent = super(FeatureObserverTimelineHandler, self)
        return parent.get_template_data()
class FeatureHandler(basehandlers.FlaskHandler):
    """Base handler returning the latest datapoint of every known bucket.

    Subclasses are expected to define ``CACHE_KEY`` (the ramcache key),
    ``MODEL_CLASS`` (the datapoint model) and ``PROPERTY_CLASS`` (the model
    listing the buckets).
    """

    HTTP_CACHE_TYPE = 'private'
    JSONIFY = True

    def __query_metrics_for_properties(self):
        """Collect the most recent datapoint for each bucket.

        Returns:
          A list of MODEL_CLASS datapoints, at most one per bucket, sorted
          by ``day_percentage`` with the highest first.
        """
        model = self.MODEL_CLASS

        # Start loading the bucket list while the batch query below runs.
        buckets_future = self.PROPERTY_CLASS.query().fetch_async(None)

        # First, grab a bunch of recent datapoints in a batch.
        # That operation is fast and makes most of the iterations
        # of the main loop become in-RAM operations.
        recent = model.query().order(-model.date).fetch(5000)
        logging.info('batch query found %r recent datapoints', len(recent))

        # The batch is ordered newest first, so the first datapoint seen for
        # a bucket is its latest one; later ones must not overwrite it.
        latest_by_bucket = {}
        for candidate in recent:
            latest_by_bucket.setdefault(candidate.bucket_id, candidate)
        logging.info('batch query found datapoints for %r buckets',
                     len(latest_by_bucket))

        # For every css property, fetch latest day_percentage.
        collected = []
        pending = []
        for bucket in buckets_future.get_result():
            if bucket.bucket_id in latest_by_bucket:
                collected.append(latest_by_bucket[bucket.bucket_id])
                continue
            # Not covered by the batch: look this bucket up on its own.
            fallback = model.query().filter(
                model.bucket_id == bucket.bucket_id).order(-model.date)
            pending.append(fallback.get_async())

        for future in pending:
            newest = future.result()
            if newest:
                collected.append(newest)

        # Sort list by percentage. Highest first.
        return sorted(
            collected, key=lambda point: point.day_percentage, reverse=True)

    def get_template_data(self):
        """Return the filtered latest datapoints, using ramcache when possible.

        For models.FeatureObserver the data is reloaded when the cached value
        is falsy or a 'refresh' request argument is given; for every other
        model it is reloaded only when nothing is cached (None).
        """
        is_feature_observer = self.MODEL_CLASS == models.FeatureObserver
        properties = ramcache.get(self.CACHE_KEY)

        if is_feature_observer:
            needs_reload = (
                not properties or self.request.args.get('refresh'))
        else:
            logging.info(
                'looked at cache %r and found %s', self.CACHE_KEY,
                repr(properties)[:settings.MAX_LOG_LINE])
            needs_reload = properties is None
            if needs_reload:
                logging.info('Loading properties from datastore')

        if needs_reload:
            properties = self.__query_metrics_for_properties()
            ramcache.set(self.CACHE_KEY, properties, time=CACHE_AGE)

        logging.info('before filtering: %s',
                     repr(properties)[:settings.MAX_LOG_LINE])
        return _filter_metric_data(properties)
class CSSPopularityHandler(FeatureHandler):
    """Feature handler pairing StableInstance with CssPropertyHistogram."""

    PROPERTY_CLASS = models.CssPropertyHistogram
    MODEL_CLASS = models.StableInstance
    CACHE_KEY = 'css_popularity'

    def get_template_data(self):
        """Delegate, unchanged, to the parent class implementation."""
        parent = super(CSSPopularityHandler, self)
        return parent.get_template_data()
class CSSAnimatedHandler(FeatureHandler):
    """Feature handler pairing AnimatedProperty with CssPropertyHistogram."""

    PROPERTY_CLASS = models.CssPropertyHistogram
    MODEL_CLASS = models.AnimatedProperty
    CACHE_KEY = 'css_animated'

    def get_template_data(self):
        """Delegate, unchanged, to the parent class implementation."""
        parent = super(CSSAnimatedHandler, self)
        return parent.get_template_data()
class FeatureObserverPopularityHandler(FeatureHandler):
    """Feature handler pairing FeatureObserver with its histogram model."""

    PROPERTY_CLASS = models.FeatureObserverHistogram
    MODEL_CLASS = models.FeatureObserver
    CACHE_KEY = 'featureob_popularity'

    def get_template_data(self):
        """Delegate, unchanged, to the parent class implementation."""
        parent = super(FeatureObserverPopularityHandler, self)
        return parent.get_template_data()
# TODO(jrobbins): Is this ever called? I don't see what calls it.
# And, I don't see recent requests for it in the server logs.
# The CL that added it only added this class, no caller.
class FeatureBucketsHandler(basehandlers.FlaskHandler):
    """Handler listing the items of a histogram model, sorted by value."""

    JSONIFY = True

    def get_template_data(self, prop_type):
        """Return the sorted ``get_all()`` items of the selected histogram.

        Args:
          prop_type: 'cssprops' selects models.CssPropertyHistogram; any
            other value selects models.FeatureObserverHistogram.

        Returns:
          A list of the ``get_all().items()`` pairs, sorted by the second
          element of each pair.
        """
        if prop_type == 'cssprops':
            histogram = models.CssPropertyHistogram
        else:
            histogram = models.FeatureObserverHistogram
        return sorted(histogram.get_all().items(), key=lambda pair: pair[1])