2010-09-21 16:31:26 -07:00
|
|
|
from django.db.models import Avg, Count, Max, Min, StdDev
|
|
|
|
|
|
|
|
from main.utils import cache_function
|
|
|
|
from .models import MirrorLog, MirrorProtocol, MirrorUrl
|
|
|
|
|
|
|
|
import datetime
|
|
|
|
|
2010-09-23 08:33:32 -07:00
|
|
|
# Look-back window (24 hours) used as the default `cutoff` argument by the
# status and error queries in this module.
default_cutoff = datetime.timedelta(days=1)
|
2010-09-21 16:31:26 -07:00
|
|
|
|
2011-04-18 13:10:20 -07:00
|
|
|
def annotate_url(url, delays):
    '''Given a MirrorURL object, add a few more attributes to it regarding
    status, including completion_pct, delay, and score.

    `url` must already carry the attributes success_count, check_count,
    duration_avg and duration_stddev. `delays` maps a URL id to a list of
    timedelta objects.

    Attributes set on `url`:
      completion_pct -- success_count / check_count as a float, or 0.0 when
                        no checks have been recorded.
      delay          -- mean of the timedeltas listed for this URL, or None
                        when there are none.
      score          -- (delay in hours + duration_avg + duration_stddev)
                        divided by completion_pct, or None when there is no
                        delay data.
    '''
    if url.check_count:
        url.completion_pct = float(url.success_count) / url.check_count
    else:
        # No checks recorded: report 0% instead of dividing by zero.
        url.completion_pct = 0.0

    url_delays = delays.get(url.id)
    if not url_delays:
        # Missing entry or empty list: nothing to average, so no score either.
        url.delay = None
        url.score = None
        return

    url.delay = sum(url_delays, datetime.timedelta()) / len(url_delays)
    hours = url.delay.days * 24.0 + url.delay.seconds / 3600.0

    if url.completion_pct > 0:
        divisor = url.completion_pct
    else:
        # arbitrary small value, so a URL with no successes gets a large
        # score instead of triggering a division by zero
        divisor = 0.005
    url.score = (hours + url.duration_avg + url.duration_stddev) / divisor
|
|
|
|
|
2012-01-05 11:03:00 -08:00
|
|
|
@cache_function(123)
def get_mirror_statuses(cutoff=default_cutoff):
    '''Collect status information for mirror URLs checked within `cutoff`.

    `cutoff` is a timedelta subtracted from the current UTC time; only logs
    with a check_time at or after that instant are considered.

    Returns a dict with these keys:
      'cutoff'          -- the `cutoff` argument, unchanged.
      'last_check'      -- newest last_check across the URLs, or None.
      'num_checks'      -- largest per-URL check_count, or 0.
      'check_frequency' -- (newest - oldest check_time) / (num_checks - 1),
                           or None when there are fewer than two checks.
      'urls'            -- the annotated MirrorUrl queryset; each object has
                           also been passed through annotate_url().

    NOTE(review): the result goes through cache_function(123); the argument
    is presumably a cache lifetime -- confirm in main.utils.
    '''
    oldest_allowed = datetime.datetime.utcnow() - cutoff
    download_protocols = list(MirrorProtocol.objects.filter(is_download=True))

    # Per-URL aggregates over the logs inside the window, restricted to
    # active, public mirrors that use a download protocol.
    candidates = MirrorUrl.objects.select_related('mirror', 'protocol').filter(
        mirror__active=True,
        mirror__public=True,
        protocol__in=download_protocols,
        logs__check_time__gte=oldest_allowed)
    urls = candidates.annotate(
        check_count=Count('logs'),
        success_count=Count('logs__duration'),
        last_sync=Max('logs__last_sync'),
        last_check=Max('logs__check_time'),
        duration_avg=Avg('logs__duration'),
        duration_stddev=StdDev('logs__duration')
    ).order_by('-last_sync', '-duration_avg')

    # The average delay is hard to express in the aggregate query above, so
    # fetch the successful logs separately and group their delays by URL id.
    synced_logs = MirrorLog.objects.filter(
        is_success=True, last_sync__isnull=False,
        check_time__gte=oldest_allowed)
    delays = {}
    for entry in synced_logs:
        delays.setdefault(entry.url_id, []).append(
            entry.check_time - entry.last_sync)

    # Values reported when no URL matched the window.
    last_check = None
    num_checks = 0
    check_frequency = None
    if urls:
        last_check = max(u.last_check for u in urls)
        num_checks = max(u.check_count for u in urls)
        window = MirrorLog.objects.filter(
            check_time__gte=oldest_allowed).aggregate(
            mn=Min('check_time'), mx=Max('check_time'))
        if num_checks > 1:
            # n checks span n - 1 intervals.
            check_frequency = (window['mx'] - window['mn']) / (num_checks - 1)

    for url in urls:
        annotate_url(url, delays)

    return {
        'cutoff': cutoff,
        'last_check': last_check,
        'num_checks': num_checks,
        'check_frequency': check_frequency,
        'urls': urls,
    }
|
2010-09-21 16:31:26 -07:00
|
|
|
|
2012-01-05 11:03:00 -08:00
|
|
|
@cache_function(117)
def get_mirror_errors(cutoff=default_cutoff):
    '''Summarize failed mirror checks recorded within `cutoff`.

    `cutoff` is a timedelta subtracted from the current UTC time; only
    unsuccessful logs at or after that instant, belonging to active and
    public mirrors, are included.

    Returns a list of dicts, one per distinct combination of URL, URL
    country, protocol, mirror country and error text, ordered by most recent
    occurrence and then by count. Each dict holds the grouped fields plus
    'error_count', 'last_occurred' and 'country' (the URL's country, falling
    back to the mirror's country when the former is empty).

    NOTE(review): the result goes through cache_function(117); the argument
    is presumably a cache lifetime -- confirm in main.utils.
    '''
    since = datetime.datetime.utcnow() - cutoff

    failed_checks = MirrorLog.objects.filter(
        is_success=False, check_time__gte=since,
        url__mirror__active=True, url__mirror__public=True)
    grouped = failed_checks.values(
        'url__url', 'url__country', 'url__protocol__protocol',
        'url__mirror__country', 'error')
    summarized = grouped.annotate(
        error_count=Count('error'), last_occurred=Max('check_time'))

    # Materialize the rows so the extra key added below is kept.
    errors = list(summarized.order_by('-last_occurred', '-error_count'))
    for entry in errors:
        entry['country'] = (entry['url__country']
                            or entry['url__mirror__country'])
    return errors
|
2010-09-21 16:31:26 -07:00
|
|
|
|
|
|
|
# vim: set ts=4 sw=4 et:
|