perf: improved campaigns suggestion perfomance by caching some things
This commit is contained in:
@@ -2,7 +2,7 @@ import json
|
||||
import uuid
|
||||
from http import HTTPStatus as status
|
||||
|
||||
from django.test import TestCase, Client
|
||||
from django.test import TestCase, Client, override_settings
|
||||
from apps.advertiser.models import Advertiser
|
||||
from apps.client.models import Client as ClientModel
|
||||
from apps.mlscore.models import Mlscore
|
||||
@@ -21,6 +21,13 @@ class TestMlscoreEndpoint(TestCase):
|
||||
|
||||
self.url = "/ml-scores"
|
||||
|
||||
@override_settings(
|
||||
CACHES={
|
||||
"default": {
|
||||
"BACKEND": "django.core.cache.backends.locmem.LocMemCache",
|
||||
}
|
||||
}
|
||||
)
|
||||
def test_create_mlscore_success(self):
|
||||
data = {
|
||||
"advertiser_id": str(self.advertiser.id),
|
||||
@@ -35,6 +42,13 @@ class TestMlscoreEndpoint(TestCase):
|
||||
self.assertEqual(response.status_code, status.OK)
|
||||
self.assertEqual(mlscore.score, 90)
|
||||
|
||||
@override_settings(
|
||||
CACHES={
|
||||
"default": {
|
||||
"BACKEND": "django.core.cache.backends.locmem.LocMemCache",
|
||||
}
|
||||
}
|
||||
)
|
||||
def test_update_mlscore_success(self):
|
||||
mlscore = Mlscore.objects.create(
|
||||
advertiser=self.advertiser,
|
||||
@@ -74,6 +88,13 @@ class TestMlscoreEndpoint(TestCase):
|
||||
|
||||
self.assertEqual(response.status_code, status.BAD_REQUEST)
|
||||
|
||||
@override_settings(
|
||||
CACHES={
|
||||
"default": {
|
||||
"BACKEND": "django.core.cache.backends.locmem.LocMemCache",
|
||||
}
|
||||
}
|
||||
)
|
||||
def test_non_existing_client(self):
|
||||
data = {
|
||||
"advertiser_id": str(self.advertiser.id),
|
||||
|
||||
@@ -0,0 +1,35 @@
|
||||
from typing import Any
|
||||
|
||||
from django.core.management.base import BaseCommand
|
||||
|
||||
from apps.campaign.models import Campaign
|
||||
from apps.mlscore.models import Mlscore
|
||||
|
||||
|
||||
class Command(BaseCommand):
|
||||
help = (
|
||||
"Initialize cache with current counts of "
|
||||
"impressions, clicks, and ML scores."
|
||||
)
|
||||
|
||||
def handle(self, *args: Any, **kwargs: Any) -> None:
|
||||
for campaign in Campaign.objects.all():
|
||||
campaign.setup_cache()
|
||||
self.stdout.write(
|
||||
self.style.SUCCESS(
|
||||
f"Initialized cache for Campaign {campaign.id}: "
|
||||
f"{campaign.impressions_count} impressions, "
|
||||
f"{campaign.clicks_count} clicks."
|
||||
)
|
||||
)
|
||||
|
||||
for mlscore in Mlscore.objects.all():
|
||||
mlscore.setup_cache()
|
||||
self.stdout.write(
|
||||
self.style.SUCCESS(
|
||||
f"Initialized cache for MLscore: "
|
||||
f"Client {mlscore.client_id}, "
|
||||
f"Advertiser {mlscore.advertiser_id}, "
|
||||
f"Score {mlscore.score}."
|
||||
)
|
||||
)
|
||||
@@ -1,8 +1,10 @@
|
||||
import contextlib
|
||||
import random
|
||||
from decimal import ROUND_HALF_UP, Decimal
|
||||
from logging import Logger
|
||||
from typing import Any, Self
|
||||
from uuid import UUID
|
||||
|
||||
from django.conf import settings
|
||||
from django.core.cache import cache
|
||||
from django.core.exceptions import ValidationError
|
||||
from django.core.validators import (
|
||||
@@ -22,9 +24,10 @@ from apps.campaign.validators import (
|
||||
)
|
||||
from apps.client.models import Client
|
||||
from apps.core.models import BaseModel
|
||||
from apps.mlscore.models import Mlscore
|
||||
from config.errors import ConflictError, ForbiddenError
|
||||
|
||||
logger: Logger = settings.LOGGER
|
||||
|
||||
|
||||
class Campaign(BaseModel):
|
||||
class GenderChoices(models.TextChoices):
|
||||
@@ -113,6 +116,24 @@ class Campaign(BaseModel):
|
||||
if self.start_date < current_date:
|
||||
raise ValidationError(err) from None
|
||||
|
||||
def save(self, *args: Any, **kwargs: Any) -> None:
|
||||
created = self.pk is None
|
||||
|
||||
super().save(*args, **kwargs)
|
||||
|
||||
if created:
|
||||
self.setup_cache()
|
||||
|
||||
def setup_cache(self) -> None:
|
||||
cache.add(
|
||||
f"campaign_{self.id}_impressions_count", self.impressions.count()
|
||||
)
|
||||
cache.add(f"campaign_{self.id}_clicks_count", self.clicks.count())
|
||||
cache.set(
|
||||
f"campaign_{self.id}_impressions_count", self.impressions.count()
|
||||
)
|
||||
cache.set(f"campaign_{self.id}_clicks_count", self.clicks.count())
|
||||
|
||||
@property
|
||||
def ad_id(self) -> UUID:
|
||||
return self.id
|
||||
@@ -138,32 +159,54 @@ class Campaign(BaseModel):
|
||||
and cache.get("current_date", default=0) <= self.end_date
|
||||
)
|
||||
|
||||
@property
|
||||
def impressions_count(self) -> int:
|
||||
return cache.get(f"campaign_{self.id}_impressions_count", 0)
|
||||
|
||||
@property
|
||||
def clicks_count(self) -> int:
|
||||
return cache.get(f"campaign_{self.id}_clicks_count", 0)
|
||||
|
||||
def view(self, client: Client) -> None:
|
||||
with contextlib.suppress(ConflictError):
|
||||
try:
|
||||
CampaignImpression.objects.create(
|
||||
campaign=self,
|
||||
client=client,
|
||||
campaign_id=self.id,
|
||||
client_id=client.id,
|
||||
price=self.cost_per_impression,
|
||||
date=cache.get("current_date", default=0),
|
||||
)
|
||||
try:
|
||||
cache.incr(f"campaign_{self.id}_impressions_count", 1)
|
||||
except ValueError:
|
||||
self.setup_cache()
|
||||
logger.warning(
|
||||
"Seems that %s missing caches", self.campaign_id
|
||||
)
|
||||
except ConflictError:
|
||||
pass
|
||||
|
||||
def click(self, client: Client) -> None:
|
||||
if not self.active:
|
||||
err = "Can't click on inactive campaign."
|
||||
raise ForbiddenError(err)
|
||||
|
||||
try:
|
||||
CampaignImpression.objects.get(campaign=self, client=client)
|
||||
except CampaignImpression.DoesNotExist:
|
||||
raise ForbiddenError from None
|
||||
|
||||
with contextlib.suppress(ConflictError):
|
||||
try:
|
||||
CampaignClick.objects.create(
|
||||
campaign=self,
|
||||
client=client,
|
||||
campaign_id=self.id,
|
||||
client_id=client.id,
|
||||
price=self.cost_per_click,
|
||||
date=cache.get("current_date", default=0),
|
||||
)
|
||||
try:
|
||||
cache.incr(f"campaign_{self.id}_clicks_count", 1)
|
||||
except ValueError:
|
||||
self.setup_cache()
|
||||
logger.warning(
|
||||
"Seems that %s missing caches", self.campaign_id
|
||||
)
|
||||
except ConflictError:
|
||||
pass
|
||||
|
||||
def get_statistics(self) -> dict[str, Any]:
|
||||
impressions = self.impressions.aggregate(
|
||||
@@ -278,69 +321,69 @@ class Campaign(BaseModel):
|
||||
| models.Q(age_from__isnull=True)
|
||||
) & (models.Q(age_to__gte=client.age) | models.Q(age_to__isnull=True))
|
||||
|
||||
return (
|
||||
cls.objects.filter(
|
||||
date_filter,
|
||||
location_filter,
|
||||
gender_filter,
|
||||
age_filter,
|
||||
)
|
||||
.select_related("advertiser")
|
||||
.prefetch_related("clicks", "impressions", "advertiser__mlscores")
|
||||
return cls.objects.filter(
|
||||
date_filter,
|
||||
location_filter,
|
||||
gender_filter,
|
||||
age_filter,
|
||||
).only(
|
||||
Campaign.id.field.name,
|
||||
Campaign.advertiser_id.field.name,
|
||||
Campaign.impressions_limit.field.name,
|
||||
Campaign.clicks_limit.field.name,
|
||||
Campaign.cost_per_impression.field.name,
|
||||
Campaign.cost_per_click.field.name,
|
||||
)
|
||||
|
||||
@classmethod
|
||||
def suggest(cls, client: Client) -> Self:
|
||||
base_campaigns = cls.get_available_campaigns(client)
|
||||
if not base_campaigns or base_campaigns == []:
|
||||
campaigns = cls.get_available_campaigns(client)
|
||||
if not campaigns or campaigns == []:
|
||||
return None
|
||||
|
||||
advertiser_ids = list({c.advertiser_id for c in base_campaigns})
|
||||
ml_scores = Mlscore.objects.filter(
|
||||
client=client, advertiser_id__in=advertiser_ids
|
||||
).values("advertiser_id", "score")
|
||||
ml_dict = {m["advertiser_id"]: m["score"] for m in ml_scores}
|
||||
|
||||
campaigns = list(
|
||||
base_campaigns.annotate(
|
||||
impressions_count=models.Count("impressions"),
|
||||
clicks_count=models.Count("clicks"),
|
||||
)
|
||||
)
|
||||
campaign_ids = [c.id for c in campaigns]
|
||||
|
||||
client_impressions = set(
|
||||
CampaignImpression.objects.filter(
|
||||
client=client, campaign_id__in=campaign_ids
|
||||
).values_list("campaign_id", flat=True)
|
||||
)
|
||||
client_clicks = set(
|
||||
CampaignClick.objects.filter(
|
||||
client=client, campaign_id__in=campaign_ids
|
||||
).values_list("campaign_id", flat=True)
|
||||
)
|
||||
client_impressions = CampaignImpression.objects.filter(
|
||||
client=client, campaign_id__in=campaign_ids
|
||||
).values_list("campaign_id", flat=True)
|
||||
client_clicks = CampaignClick.objects.filter(
|
||||
client=client, campaign_id__in=campaign_ids
|
||||
).values_list("campaign_id", flat=True)
|
||||
|
||||
prioritized = []
|
||||
ml_values = []
|
||||
profit_values = []
|
||||
exceed_impressions_chance = ( # oh, can i just skip commenting this?
|
||||
*(0 for i in range(4)),
|
||||
*(1 for i in range(1)),
|
||||
)
|
||||
|
||||
for campaign in campaigns:
|
||||
if campaign.impressions_count >= campaign.impressions_limit:
|
||||
continue
|
||||
|
||||
ml_score = ml_dict.get(campaign.advertiser_id, 0)
|
||||
ml_values.append(ml_score)
|
||||
|
||||
has_impression = campaign.id in client_impressions
|
||||
has_click = campaign.id in client_clicks
|
||||
|
||||
if not has_impression:
|
||||
allow_exceed_impressions = random.choice(
|
||||
exceed_impressions_chance
|
||||
)
|
||||
impressions_limit = round(
|
||||
campaign.impressions_limit
|
||||
+ campaign.impressions_limit
|
||||
* 0.01
|
||||
* allow_exceed_impressions
|
||||
)
|
||||
if campaign.impressions_count >= impressions_limit:
|
||||
continue
|
||||
|
||||
ml_score = cache.get(
|
||||
f"mlscore_{client.id}_{campaign.advertiser_id}", 0
|
||||
)
|
||||
ml_values.append(ml_score)
|
||||
|
||||
if has_impression:
|
||||
profit = campaign.cost_per_click if not has_click else 0
|
||||
else:
|
||||
profit = campaign.cost_per_impression + campaign.cost_per_click
|
||||
print(profit)
|
||||
if profit <= 0:
|
||||
continue
|
||||
|
||||
profit_values.append(profit)
|
||||
|
||||
@@ -364,28 +407,43 @@ class Campaign(BaseModel):
|
||||
)
|
||||
)
|
||||
|
||||
max_ml = max(ml_values) if ml_values else 1
|
||||
max_profit = max(profit_values) if profit_values else 1
|
||||
min_profit = min(profit_values) if profit_values else 0
|
||||
if not ml_values or not profit_values:
|
||||
return None
|
||||
|
||||
max_ml = max(ml_values)
|
||||
max_profit = max(profit_values)
|
||||
min_profit = min(profit_values)
|
||||
profit_range = (
|
||||
max_profit - min_profit if max_profit != min_profit else 1
|
||||
)
|
||||
|
||||
print(prioritized, max_ml, max_profit, min_profit, profit_range)
|
||||
|
||||
final_list = []
|
||||
for campaign, metrics in prioritized:
|
||||
norm_profit = (metrics["profit"] - min_profit) / profit_range
|
||||
norm_ml = metrics["ml"] / max_ml if max_ml > 0 else 0
|
||||
|
||||
priority = (
|
||||
0.5 * norm_profit + 0.25 * norm_ml + 0.15 * metrics["capacity"]
|
||||
0.7 * norm_profit + 0.2 * norm_ml + 0.1 * metrics["capacity"]
|
||||
)
|
||||
|
||||
final_list.append((campaign, priority))
|
||||
|
||||
final_list.sort(key=lambda x: -x[1])
|
||||
return final_list[0][0] if len(final_list) >= 1 else None
|
||||
|
||||
if len(final_list) != 0:
|
||||
campaign = final_list[0][0]
|
||||
|
||||
return Campaign.objects.only(
|
||||
Campaign.id.field.name,
|
||||
Campaign.advertiser_id.field.name,
|
||||
Campaign.ad_title.field.name,
|
||||
Campaign.ad_text.field.name,
|
||||
Campaign.ad_image.field.name,
|
||||
Campaign.cost_per_impression.field.name,
|
||||
Campaign.cost_per_click.field.name,
|
||||
).get(id=campaign.id)
|
||||
|
||||
return None
|
||||
|
||||
|
||||
class CampaignImpression(BaseModel):
|
||||
|
||||
@@ -1,3 +1,6 @@
|
||||
from typing import Any
|
||||
|
||||
from django.core.cache import cache
|
||||
from django.db import models
|
||||
|
||||
from apps.advertiser.models import Advertiser
|
||||
@@ -21,6 +24,15 @@ class Mlscore(BaseModel):
|
||||
def __str__(self) -> str:
|
||||
return f"{self.advertiser.name} | {self.client.login}"
|
||||
|
||||
def save(self, *args: Any, **kwargs: Any) -> None:
|
||||
super().save(*args, **kwargs)
|
||||
|
||||
self.setup_cache()
|
||||
|
||||
def setup_cache(self) -> None:
|
||||
cache.add(f"mlscore_{self.client_id}_{self.advertiser_id}", self.score)
|
||||
cache.set(f"mlscore_{self.client_id}_{self.advertiser_id}", self.score)
|
||||
|
||||
class Meta:
|
||||
unique_together = (
|
||||
"advertiser",
|
||||
|
||||
@@ -1,5 +1,4 @@
|
||||
from django.test import TestCase
|
||||
from django.db.utils import IntegrityError
|
||||
from django.test import TestCase, override_settings
|
||||
from django.core.exceptions import ValidationError
|
||||
from config.errors import ConflictError
|
||||
from apps.advertiser.models import Advertiser
|
||||
@@ -17,6 +16,13 @@ class MlscoreModelTest(TestCase):
|
||||
gender=Client.GenderChoices.MALE,
|
||||
)
|
||||
|
||||
@override_settings(
|
||||
CACHES={
|
||||
"default": {
|
||||
"BACKEND": "django.core.cache.backends.locmem.LocMemCache",
|
||||
}
|
||||
}
|
||||
)
|
||||
def test_create_mlscore(self):
|
||||
mlscore = Mlscore.objects.create(
|
||||
advertiser=self.advertiser,
|
||||
@@ -27,6 +33,13 @@ class MlscoreModelTest(TestCase):
|
||||
self.assertEqual(mlscore.score, 95)
|
||||
self.assertEqual(str(mlscore), "Test Advertiser | test_client")
|
||||
|
||||
@override_settings(
|
||||
CACHES={
|
||||
"default": {
|
||||
"BACKEND": "django.core.cache.backends.locmem.LocMemCache",
|
||||
}
|
||||
}
|
||||
)
|
||||
def test_mlscore_unique_together_constraint(self):
|
||||
Mlscore.objects.create(
|
||||
advertiser=self.advertiser,
|
||||
@@ -41,6 +54,13 @@ class MlscoreModelTest(TestCase):
|
||||
score=85,
|
||||
)
|
||||
|
||||
@override_settings(
|
||||
CACHES={
|
||||
"default": {
|
||||
"BACKEND": "django.core.cache.backends.locmem.LocMemCache",
|
||||
}
|
||||
}
|
||||
)
|
||||
def test_delete_advertiser_cascades(self):
|
||||
mlscore = Mlscore.objects.create(
|
||||
advertiser=self.advertiser,
|
||||
@@ -51,6 +71,13 @@ class MlscoreModelTest(TestCase):
|
||||
|
||||
self.assertFalse(Mlscore.objects.filter(id=mlscore.id).exists())
|
||||
|
||||
@override_settings(
|
||||
CACHES={
|
||||
"default": {
|
||||
"BACKEND": "django.core.cache.backends.locmem.LocMemCache",
|
||||
}
|
||||
}
|
||||
)
|
||||
def test_delete_client_cascades(self):
|
||||
mlscore = Mlscore.objects.create(
|
||||
advertiser=self.advertiser,
|
||||
|
||||
@@ -122,6 +122,7 @@ ignore = [
|
||||
"PT009",
|
||||
"PT027",
|
||||
"RUF001",
|
||||
"S311",
|
||||
]
|
||||
logger-objects = []
|
||||
per-file-ignores = {}
|
||||
|
||||
@@ -9,3 +9,5 @@ fi
|
||||
if [ "$DJANGO_CREATE_SUPERUSER" = "True" ]; then
|
||||
python manage.py createsuperuser --noinput --username "$DJANGO_SUPERUSER_USERNAME" --email "$DJANGO_SUPERUSER_EMAIL" || true
|
||||
fi
|
||||
|
||||
python manage.py init_cache
|
||||
|
||||
Reference in New Issue
Block a user