Skip to content

Commit

Permalink
Optimize and fix the /insights page (#3007)
Browse files Browse the repository at this point in the history
* Fix #2980: Prevent bots from checking the /insights page
* Optimize ProjectLocaleInsightsSnapshot Admin view/editing page
* Refactor data gathering for the /insights page

1. Fix #2979: Optimize /insights page.

To render the charts on the Insights pages, we use periodically gathered ProjectLocaleInsightsSnapshot data. That works fine on Project, Locale and
ProjectLocale pages, but not on the /insights page which shows data across the entire app. The amount of data requested from the DB quickly becomes big and the request starts timing out.

In this patch, we gather data directly from the ActionLog as hinted at in #2938.

2. Fix #2999: Show insights for all months.

3. Calculate monthly averages rather than averages of averages.
  • Loading branch information
mathjazz authored Nov 9, 2023
1 parent 59211dd commit 549cd93
Show file tree
Hide file tree
Showing 4 changed files with 66 additions and 33 deletions.
1 change: 1 addition & 0 deletions pontoon/base/templates/robots.txt
Original file line number Diff line number Diff line change
Expand Up @@ -2,3 +2,4 @@ User-agent: *
Disallow: /a/
Disallow: /admin/
Disallow: /contributors/
Disallow: /*insights/
1 change: 1 addition & 0 deletions pontoon/insights/admin.py
Original file line number Diff line number Diff line change
Expand Up @@ -52,6 +52,7 @@ class ProjectLocaleInsightsSnapshotAdmin(admin.ModelAdmin):
"completion",
"unreviewed_strings",
)
readonly_fields = ("project_locale",)


admin.site.register(LocaleInsightsSnapshot, LocaleInsightsSnapshotAdmin)
Expand Down
95 changes: 63 additions & 32 deletions pontoon/insights/utils.py
Original file line number Diff line number Diff line change
@@ -1,11 +1,12 @@
import json
import statistics

from datetime import datetime, timedelta
from dateutil.relativedelta import relativedelta
from django.contrib.auth.models import User
from django.db.models.functions import TruncMonth
from django.db.models import Avg, Count, Q, Sum

from pontoon.actionlog.models import ActionLog
from pontoon.base.utils import convert_to_unix_time
from pontoon.insights.models import (
LocaleInsightsSnapshot,
Expand Down Expand Up @@ -365,25 +366,43 @@ def get_insights(locale=None, project=None):

def get_global_pretranslation_quality(category, id):
start_date = get_insight_start_date()
snapshots = ProjectLocaleInsightsSnapshot.objects.filter(
created_at__gte=start_date,
project_locale__pretranslation_enabled=True,
)

insights = (
snapshots
sync_user = User.objects.get(email="[email protected]").pk

pretranslation_users = User.objects.filter(
email__in=[
"[email protected]",
"[email protected]",
]
).values_list("pk", flat=True)

actions = (
ActionLog.objects.filter(
created_at__gte=start_date,
action_type__in=["translation:approved", "translation:rejected"],
translation__user__in=pretranslation_users,
)
.exclude(performed_by=sync_user)
# Truncate to month and add to select list
.annotate(month=TruncMonth("created_at"))
# Group By month and locale
.values("month", f"project_locale__{category}")
# Select the avg/sum of the grouping
.annotate(pretranslations_approved_sum=Sum("pretranslations_approved"))
.annotate(pretranslations_rejected_sum=Sum("pretranslations_rejected"))
.values("month", f"translation__{category}")
# Select the sum of the grouping
.annotate(
pretranslations_approved_sum=Count(
"id", filter=Q(action_type="translation:approved")
)
)
.annotate(
pretranslations_rejected_sum=Count(
"id", filter=Q(action_type="translation:rejected")
)
)
# Select month and values
.values(
"month",
f"project_locale__{category}__{id}",
f"project_locale__{category}__name",
f"translation__{category}__{id}",
f"translation__{category}__name",
"pretranslations_approved_sum",
"pretranslations_rejected_sum",
)
Expand All @@ -393,13 +412,27 @@ def get_global_pretranslation_quality(category, id):
data = {
"all": {
"name": "All",
"approval_rate": [],
"approval_rate": [None] * 12,
}
}

for insight in insights:
key = insight[f"project_locale__{category}__{id}"]
name = insight[f"project_locale__{category}__name"]
approved = "pretranslations_approved_sum"
rejected = "pretranslations_rejected_sum"

totals = [
{
approved: 0,
rejected: 0,
}
for x in range(0, 12)
]

for action in actions:
key = action[f"translation__{category}__{id}"]
name = action[f"translation__{category}__name"]
month_index = relativedelta(
action["month"].replace(tzinfo=None), start_date
).months

if category == "locale":
name = f"{name} · {key}"
Expand All @@ -408,24 +441,22 @@ def get_global_pretranslation_quality(category, id):
key,
{
"name": name,
"approval_rate": [],
"approval_rate": [None] * 12,
},
)

item["approval_rate"].append(get_approval_rate(insight))

# Monthly total across the entire category
category_approval_rates = [value["approval_rate"] for value in data.values()]

for month in zip(*category_approval_rates[1:]):
not_none = [x for x in month if x is not None]
if not_none:
total = statistics.mean(not_none)
else:
total = None
data["all"]["approval_rate"].append(total)
item["approval_rate"][month_index] = get_approval_rate(action)
totals[month_index][approved] += action[approved]
totals[month_index][rejected] += action[rejected]

# Monthly totals across the entire category
total_approval_rates = data["all"]["approval_rate"]
for idx, _ in enumerate(total_approval_rates):
total_approval_rates[idx] = get_approval_rate(totals[idx])
total_approval_rates = [
get_approval_rate(totals[idx]) for idx, _ in enumerate(total_approval_rates)
]

return {
"dates": list({convert_to_unix_time(x["month"]) for x in insights}),
"dates": list({convert_to_unix_time(x["month"]) for x in actions}),
"dataset": json.dumps([v for _, v in data.items()]),
}
2 changes: 1 addition & 1 deletion pontoon/insights/views.py
Original file line number Diff line number Diff line change
Expand Up @@ -26,7 +26,7 @@ def insights(request):
"locale", "code"
),
"project_pretranslation_quality": get_global_pretranslation_quality(
"project", "slug"
"entity__resource__project", "slug"
),
},
)

0 comments on commit 549cd93

Please sign in to comment.