2023-11-19 19:45:19 +01:00
|
|
|
from datetime import datetime, timedelta
|
2022-03-12 13:33:15 +01:00
|
|
|
|
|
|
|
from django.db.models import Sum
|
|
|
|
from django.utils.timezone import now as timezone_now
|
|
|
|
|
|
|
|
from analytics.lib.counts import COUNT_STATS
|
|
|
|
from analytics.models import StreamCount
|
2023-08-07 16:47:48 +02:00
|
|
|
from zerver.models import Realm
|
2022-03-12 13:33:15 +01:00
|
|
|
|
|
|
|
|
2024-07-12 02:30:23 +02:00
|
|
|
def get_streams_traffic(stream_ids: set[int], realm: Realm) -> dict[int, int] | None:
    """Sum recent per-stream StreamCount values for the given streams.

    Aggregates the "messages_in_stream:is_bot:day" stat over rows whose
    end_time falls within the last 28 days, restricted to `realm` and to
    the IDs in `stream_ids`.

    Returns a dict mapping stream ID to the summed value; streams with no
    matching rows do not appear in it. Returns None when the realm is a
    Zephyr mirror realm.
    """
    # We do not need traffic data for streams in zephyr mirroring realm.
    if realm.is_zephyr_mirror_realm:
        return None

    message_stat = COUNT_STATS["messages_in_stream:is_bot:day"]
    window_start = timezone_now() - timedelta(days=28)

    per_stream_totals = (
        StreamCount.objects.filter(
            # The realm_id is important, as it makes this significantly better-indexed
            realm_id=realm.id,
            stream_id__in=stream_ids,
            property=message_stat.property,
            end_time__gt=window_start,
        )
        .values("stream_id")
        .annotate(value=Sum("value"))
    )

    return {row["stream_id"]: row["value"] for row in per_stream_totals}
|
|
|
|
|
|
|
|
|
|
|
|
def round_to_2_significant_digits(number: int) -> int:
    """Round an integer to at most two significant digits.

    Numbers with one or two digits are returned unchanged. Larger numbers
    have everything past the second digit rounded away, e.g. 116 -> 120
    and 1234 -> 1200. Ties follow the built-in round() (round half to
    even), so 125 -> 120.

    Negative numbers are rounded by magnitude, e.g. -123 -> -120.
    """
    # Count the digits of the magnitude only; otherwise the "-" sign of a
    # negative number would be counted as a digit and cost one digit of
    # precision.
    digit_count = len(str(abs(number)))
    return int(round(number, 2 - digit_count))
|
|
|
|
|
|
|
|
|
|
|
|
# Minimum stream age, in days, before get_average_weekly_stream_traffic
# reports a value; for younger streams it returns None.
STREAM_TRAFFIC_CALCULATION_MIN_AGE_DAYS = 7
|
|
|
|
|
|
|
|
|
|
|
|
def get_average_weekly_stream_traffic(
    stream_id: int, stream_date_created: datetime, recent_traffic: dict[int, int]
) -> int | None:
    """Estimate a stream's average weekly traffic, to two significant digits.

    `recent_traffic` maps stream IDs to a traffic total; a stream missing
    from it is treated as having zero traffic.
    NOTE(review): the division by 4 for streams aged 28+ days suggests the
    totals cover the last 28 days -- confirm against the caller.

    Returns None when the stream is younger than
    STREAM_TRAFFIC_CALCULATION_MIN_AGE_DAYS days. Otherwise returns the
    weekly average, never reporting 0 for a stream with nonzero traffic.
    """
    total_recent = recent_traffic.get(stream_id, 0)
    age_in_days = (timezone_now() - stream_date_created).days

    if age_in_days >= 28:
        # Old enough for a full 28 days: average over four weeks.
        weekly_average = int(total_recent // 4)
    elif age_in_days >= STREAM_TRAFFIC_CALCULATION_MIN_AGE_DAYS:
        # Younger stream: scale the total to a 7-day rate using its age.
        weekly_average = int(total_recent * 7 // age_in_days)
    else:
        return None

    if total_recent > 0 and weekly_average == 0:
        # Floor division must not make a stream with some traffic look idle.
        weekly_average = 1

    return round_to_2_significant_digits(weekly_average)
|