import os import time from argparse import ArgumentParser from datetime import timezone from typing import Any, Dict from django.conf import settings from django.core.management.base import BaseCommand from django.utils.dateparse import parse_datetime from django.utils.timezone import now as timezone_now from analytics.lib.counts import COUNT_STATS, logger, process_count_stat from scripts.lib.zulip_tools import ENDC, WARNING from zerver.lib.remote_server import send_analytics_to_remote_server from zerver.lib.timestamp import floor_to_hour from zerver.models import Realm class Command(BaseCommand): help = """Fills Analytics tables. Run as a cron job that runs every hour.""" def add_arguments(self, parser: ArgumentParser) -> None: parser.add_argument('--time', '-t', help='Update stat tables from current state to' '--time. Defaults to the current time.', default=timezone_now().isoformat()) parser.add_argument('--utc', action='store_true', help="Interpret --time in UTC.") parser.add_argument('--stat', '-s', help="CountStat to process. If omitted, all stats are processed.") parser.add_argument('--verbose', action='store_true', help="Print timing information to stdout.") def handle(self, *args: Any, **options: Any) -> None: try: os.mkdir(settings.ANALYTICS_LOCK_DIR) except OSError: print(f"{WARNING}Analytics lock {settings.ANALYTICS_LOCK_DIR} is unavailable;" f" exiting.{ENDC}") return try: self.run_update_analytics_counts(options) finally: os.rmdir(settings.ANALYTICS_LOCK_DIR) def run_update_analytics_counts(self, options: Dict[str, Any]) -> None: # installation_epoch relies on there being at least one realm; we # shouldn't run the analytics code if that condition isn't satisfied if not Realm.objects.exists(): logger.info("No realms, stopping update_analytics_counts") return fill_to_time = parse_datetime(options['time']) if options['utc']: fill_to_time = fill_to_time.replace(tzinfo=timezone.utc) if fill_to_time.tzinfo is None: raise ValueError("--time must be timezone aware. Maybe you meant to use the --utc option?") fill_to_time = floor_to_hour(fill_to_time.astimezone(timezone.utc)) if options['stat'] is not None: stats = [COUNT_STATS[options['stat']]] else: stats = list(COUNT_STATS.values()) logger.info("Starting updating analytics counts through %s", fill_to_time) if options['verbose']: start = time.time() last = start for stat in stats: process_count_stat(stat, fill_to_time) if options['verbose']: print(f"Updated {stat.property} in {time.time() - last:.3f}s") last = time.time() if options['verbose']: print(f"Finished updating analytics counts through {fill_to_time} in {time.time() - start:.3f}s") logger.info("Finished updating analytics counts through %s", fill_to_time) if settings.PUSH_NOTIFICATION_BOUNCER_URL and settings.SUBMIT_USAGE_STATISTICS: send_analytics_to_remote_server()