zulip/zerver/lib/rate_limiter.py

import logging
import time
from abc import ABC, abstractmethod
from typing import Optional, cast

import orjson
import redis
from circuitbreaker import CircuitBreakerError, circuit
from django.conf import settings
from django.http import HttpRequest
from typing_extensions import override

from zerver.lib import redis_utils
from zerver.lib.cache import cache_with_key
from zerver.lib.exceptions import RateLimitedError
from zerver.lib.redis_utils import get_redis_client
from zerver.models import UserProfile

# Implement a rate-limiting scheme inspired by the one described here, but heavily modified
# https://www.domaintools.com/resources/blog/rate-limiting-with-redis

# Module-wide Redis connection; RedisRateLimiterBackend issues all of its
# commands through this client.
client = get_redis_client()
# Maps a rate-limiting domain name to its list of (seconds, max_requests) rules.
rules: dict[str, list[tuple[int, int]]] = settings.RATE_LIMITING_RULES

logger = logging.getLogger(__name__)


class RateLimiterLockingError(Exception):
    """Raised when updating rate-limit counters keeps hitting Redis transaction conflicts."""


class RateLimitedObject(ABC):
    """Base class for an entity whose requests are subject to rate limits.

    Subclasses provide a unique ``key()`` and their ``rules()``; all of the
    bookkeeping is delegated to a ``RateLimiterBackend`` class.
    """

    def __init__(self, backend: Optional["type[RateLimiterBackend]"] = None) -> None:
        # Without an explicit backend, fall back to the Redis implementation.
        self.backend: type[RateLimiterBackend] = (
            backend if backend is not None else RedisRateLimiterBackend
        )

    def rate_limit(self) -> tuple[bool, float]:
        """Run this entity through its backend; returns (ratelimited, secs_to_freedom)."""
        entity_key = self.key()
        applicable_rules = self.get_rules()
        return self.backend.rate_limit_entity(
            entity_key, applicable_rules, self.max_api_calls(), self.max_api_window()
        )

    def rate_limit_request(self, request: HttpRequest) -> None:
        """Apply this entity's limits to ``request``.

        A ``RateLimitResult`` describing the outcome is appended to the
        request notes' ``ratelimits_applied`` list. Raises ``RateLimitedError``
        when the entity is over its limits.
        """
        from zerver.lib.request import RequestNotes

        over_limit, secs_to_freedom = self.rate_limit()
        notes = RequestNotes.get_notes(request)

        result = RateLimitResult(
            entity=self,
            secs_to_freedom=secs_to_freedom,
            remaining=0,
            over_limit=over_limit,
        )
        notes.ratelimits_applied.append(result)

        # Abort this request if the entity is over its rate limits.
        if over_limit:
            raise RateLimitedError(secs_to_freedom)

        # Not limited: replace the placeholder values with the real budget.
        calls_remaining, seconds_until_reset = self.api_calls_left()
        result.remaining = calls_remaining
        result.secs_to_freedom = seconds_until_reset

    def block_access(self, seconds: int) -> None:
        """Manually block this entity for ``seconds`` seconds."""
        entity_key = self.key()
        self.backend.block_access(entity_key, seconds)

    def unblock_access(self) -> None:
        """Lift a manual block on this entity."""
        entity_key = self.key()
        self.backend.unblock_access(entity_key)

    def clear_history(self) -> None:
        """Ask the backend to forget everything recorded for this entity."""
        entity_key = self.key()
        self.backend.clear_history(entity_key)

    def max_api_calls(self) -> int:
        """Return the request count of the last (highest) rule."""
        last_rule = self.get_rules()[-1]
        return last_rule[1]

    def max_api_window(self) -> int:
        """Return the time window, in seconds, of the last (highest) rule."""
        last_rule = self.get_rules()[-1]
        return last_rule[0]

    def api_calls_left(self) -> tuple[int, float]:
        """Return how many calls remain under the highest rule, together with
        the number of seconds until the rate limit resets."""
        return self.backend.get_api_calls_left(
            self.key(), self.max_api_window(), self.max_api_calls()
        )

    def get_rules(self) -> list[tuple[int, int]]:
        """
        Return ``rules()``, substituting a single very permissive rule when it
        is empty. This spares the rest of the system from special-casing an
        empty rule list; "9999 requests per second" is a good proxy for
        "no rules".
        """
        return self.rules() or [(1, 9999)]

    @abstractmethod
    def key(self) -> str:
        """Return the string that uniquely identifies this entity to the backend."""

    @abstractmethod
    def rules(self) -> list[tuple[int, int]]:
        """Return the (seconds, max_requests) rules for this entity; may be empty."""


class RateLimitedUser(RateLimitedObject):
    """Rate-limit entity for a single user within one rate-limiting domain."""

    def __init__(self, user: UserProfile, domain: str = "api_by_user") -> None:
        self.user_id = user.id
        self.rate_limits = user.rate_limits
        self.domain = domain
        # Domains configured for Tornado use the in-memory backend when we are
        # running inside Tornado; otherwise the base class picks its default.
        use_tornado_backend = (
            settings.RUNNING_INSIDE_TORNADO and domain in settings.RATE_LIMITING_DOMAINS_FOR_TORNADO
        )
        backend: type[RateLimiterBackend] | None = (
            TornadoInMemoryRateLimiterBackend if use_tornado_backend else None
        )
        super().__init__(backend=backend)

    @override
    def key(self) -> str:
        """Return ``<class name>:<user id>:<domain>``."""
        class_name = type(self).__name__
        return f"{class_name}:{self.user_id}:{self.domain}"

    @override
    def rules(self) -> list[tuple[int, int]]:
        """Return the user's own limits for 'api_by_user', else the domain's rules.

        ``rate_limits`` is parsed as comma-separated ``seconds:requests`` pairs.
        """
        # user.rate_limits are general limits, applicable to the domain 'api_by_user'
        has_custom_limits = self.rate_limits != "" and self.domain == "api_by_user"
        if not has_custom_limits:
            return rules[self.domain]

        pairs = (entry.split(":", 2) for entry in self.rate_limits.split(","))
        return [(int(seconds), int(requests)) for seconds, requests in pairs]


class RateLimitedIPAddr(RateLimitedObject):
    """Rate-limit entity for an IP address within one rate-limiting domain."""

    def __init__(self, ip_addr: str, domain: str = "api_by_ip") -> None:
        self.ip_addr = ip_addr
        self.domain = domain
        # Domains configured for Tornado use the in-memory backend when we are
        # running inside Tornado; otherwise the base class picks its default.
        use_tornado_backend = (
            settings.RUNNING_INSIDE_TORNADO and domain in settings.RATE_LIMITING_DOMAINS_FOR_TORNADO
        )
        backend: type[RateLimiterBackend] | None = (
            TornadoInMemoryRateLimiterBackend if use_tornado_backend else None
        )
        super().__init__(backend=backend)

    @override
    def key(self) -> str:
        """Return ``<class name>:<<ip address>>:<domain>``."""
        class_name = type(self).__name__
        # The angle brackets are important since IPv6 addresses contain :.
        return f"{class_name}:<{self.ip_addr}>:{self.domain}"

    @override
    def rules(self) -> list[tuple[int, int]]:
        """Return the rules configured for this entity's domain."""
        domain_rules = rules[self.domain]
        return domain_rules


class RateLimiterBackend(ABC):
    """Interface every rate-limiting storage backend implements.

    All operations are classmethods keyed by the entity's string key.
    """

    @classmethod
    @abstractmethod
    def block_access(cls, entity_key: str, seconds: int) -> None:
        """Manually blocks an entity for the desired number of seconds"""

    @classmethod
    @abstractmethod
    def unblock_access(cls, entity_key: str) -> None:
        """Remove a manual block from the entity."""

    @classmethod
    @abstractmethod
    def clear_history(cls, entity_key: str) -> None:
        """Discard the state stored for the entity."""

    @classmethod
    @abstractmethod
    def get_api_calls_left(
        cls, entity_key: str, range_seconds: int, max_calls: int
    ) -> tuple[int, float]:
        """Return (calls remaining, seconds until the limit resets)."""

    @classmethod
    @abstractmethod
    def rate_limit_entity(
        cls, entity_key: str, rules: list[tuple[int, int]], max_api_calls: int, max_api_window: int
    ) -> tuple[bool, float]:
        """Returns (ratelimited, secs_to_freedom)"""


class TornadoInMemoryRateLimiterBackend(RateLimiterBackend):
    """Rate-limiter backend that keeps all of its state in class-level dicts.

    The state lives on the class itself, so it is shared by every caller that
    uses this backend class.
    """

    # reset_times[rule][key] is the time at which the event
    # request from the rate-limited key will be accepted.
    reset_times: dict[tuple[int, int], dict[str, float]] = {}

    # last_gc_time is the last time when the garbage was
    # collected from reset_times for rule (time_window, max_count).
    last_gc_time: dict[tuple[int, int], float] = {}

    # timestamps_blocked_until[key] contains the timestamp
    # up to which the key has been blocked manually.
    timestamps_blocked_until: dict[str, float] = {}

    @classmethod
    def _garbage_collect_for_rule(cls, now: float, time_window: int, max_count: int) -> None:
        """Drop every reset time for the rule that lies before ``now``.

        The rule's whole entry is removed from ``reset_times`` once it is empty.
        """
        rule = (time_window, max_count)
        reset_times_for_rule = cls.reset_times.get(rule)
        if reset_times_for_rule is None:
            return

        # Collect first, delete afterwards: a dict must not change size while
        # it is being iterated.
        expired_keys = [
            entity_key
            for entity_key, reset_time in reset_times_for_rule.items()
            if reset_time < now
        ]
        for entity_key in expired_keys:
            del reset_times_for_rule[entity_key]

        if not reset_times_for_rule:
            del cls.reset_times[rule]

    @classmethod
    def need_to_limit(cls, entity_key: str, time_window: int, max_count: int) -> tuple[bool, float]:
        """
        Returns a tuple of `(rate_limited, time_till_free)`.
        For simplicity, we have loosened the semantics here from
        - each key may make at most `count * (t / window)` request within any t
          time interval.
        to
        - each key may make at most `count * [(t / window) + 1]` request within
          any t time interval.
        Thus, we only need to store reset_times for each key which will be less
        memory-intensive. This also has the advantage that you can only ever
        lock yourself out completely for `window / count` seconds instead of
        `window` seconds.
        """
        now = time.time()
        rule = (time_window, max_count)
        # Each accepted request pushes the key's reset time forward by this much.
        interval = time_window / max_count

        # Remove all timestamps from `reset_times` that are too old.
        if cls.last_gc_time.get(rule, 0) <= now - interval:
            cls.last_gc_time[rule] = now
            cls._garbage_collect_for_rule(now, time_window, max_count)

        reset_times_for_rule = cls.reset_times.setdefault(rule, {})
        new_reset = max(reset_times_for_rule.get(entity_key, now), now) + interval

        if new_reset > now + time_window:
            # Compute for how long the bucket will remain filled. The rejected
            # request is deliberately not recorded.
            time_till_free = new_reset - time_window - now
            return True, time_till_free

        reset_times_for_rule[entity_key] = new_reset
        return False, 0.0

    @classmethod
    @override
    def get_api_calls_left(
        cls, entity_key: str, range_seconds: int, max_calls: int
    ) -> tuple[int, float]:
        """Return (calls remaining, seconds until reset) for the given rule.

        A key with no recorded reset time has its full budget available.
        """
        now = time.time()
        reset_time = cls.reset_times.get((range_seconds, max_calls), {}).get(entity_key)
        if reset_time is None:
            return max_calls, 0.0

        calls_remaining = (now + range_seconds - reset_time) * max_calls // range_seconds
        return int(calls_remaining), reset_time - now

    @classmethod
    @override
    def block_access(cls, entity_key: str, seconds: int) -> None:
        """Manually blocks an entity for the desired number of seconds"""
        cls.timestamps_blocked_until[entity_key] = time.time() + seconds

    @classmethod
    @override
    def unblock_access(cls, entity_key: str) -> None:
        """Remove a manual block; does nothing if the key is not blocked."""
        # pop() rather than del: unblocking a key that is not (or is no longer)
        # blocked is a no-op instead of a KeyError, as clear_history already
        # does for the same dict.
        cls.timestamps_blocked_until.pop(entity_key, None)

    @classmethod
    @override
    def clear_history(cls, entity_key: str) -> None:
        """Forget the key's reset times under every rule and any manual block."""
        for reset_times_for_rule in cls.reset_times.values():
            reset_times_for_rule.pop(entity_key, None)
        cls.timestamps_blocked_until.pop(entity_key, None)

    @classmethod
    @override
    def rate_limit_entity(
        cls, entity_key: str, rules: list[tuple[int, int]], max_api_calls: int, max_api_window: int
    ) -> tuple[bool, float]:
        """Returns (ratelimited, secs_to_freedom).

        A manual block takes precedence; otherwise the rules are checked in
        order and the first one that is exceeded decides the result.
        ``max_api_calls`` and ``max_api_window`` are not used by this backend.
        """
        now = time.time()
        blocked_until = cls.timestamps_blocked_until.get(entity_key)
        if blocked_until is not None:
            # Check whether the key is manually blocked.
            if now < blocked_until:
                return True, blocked_until - now
            # The block has expired; clean it up.
            del cls.timestamps_blocked_until[entity_key]

        assert rules
        for time_window, max_count in rules:
            ratelimited, time_till_free = cls.need_to_limit(entity_key, time_window, max_count)
            if ratelimited:
                return ratelimited, time_till_free

        return False, 0.0


class RedisRateLimiterBackend(RateLimiterBackend):
    """Rate-limiter backend that stores its state in Redis.

    Each entity uses three Redis keys: a list and a sorted set of request
    timestamps, and a key marking a manual block.
    """

    @classmethod
    def get_keys(cls, entity_key: str) -> list[str]:
        """Return the entity's [list, zset, block] Redis key names, in that order."""
        base = f"{redis_utils.REDIS_KEY_PREFIX}ratelimit:{entity_key}"
        return [f"{base}:{keytype}" for keytype in ("list", "zset", "block")]

    @classmethod
    @override
    def block_access(cls, entity_key: str, seconds: int) -> None:
        """Manually blocks an entity for the desired number of seconds"""
        blocking_key = cls.get_keys(entity_key)[2]
        with client.pipeline() as pipe:
            pipe.set(blocking_key, 1)
            pipe.expire(blocking_key, seconds)
            pipe.execute()

    @classmethod
    @override
    def unblock_access(cls, entity_key: str) -> None:
        """Delete the entity's manual-block key."""
        blocking_key = cls.get_keys(entity_key)[2]
        client.delete(blocking_key)

    @classmethod
    @override
    def clear_history(cls, entity_key: str) -> None:
        """Delete all three Redis keys belonging to the entity."""
        for redis_key in cls.get_keys(entity_key):
            client.delete(redis_key)

    @classmethod
    @override
    def get_api_calls_left(
        cls, entity_key: str, range_seconds: int, max_calls: int
    ) -> tuple[int, float]:
        """Return (calls remaining, seconds until the rate limit resets)."""
        list_key, set_key, _ = cls.get_keys(entity_key)
        now = time.time()
        # Only calls between this cutoff and now count against the limit.
        boundary = now - range_seconds

        with client.pipeline() as pipe:
            # How many API calls in our range have already been made?
            pipe.zcount(set_key, boundary, now)
            # The newest call tells us when the ratelimit will reset to 0.
            pipe.lindex(list_key, 0)
            results = pipe.execute()

        count: int = results[0]
        newest_call: bytes | None = results[1]

        if newest_call is None:
            time_reset = now
        else:
            time_reset = now + (range_seconds - (now - float(newest_call)))

        return max_calls - count, time_reset - now

    @classmethod
    def is_ratelimited(cls, entity_key: str, rules: list[tuple[int, int]]) -> tuple[bool, float]:
        """Returns a tuple of (rate_limited, time_till_free)"""
        assert rules
        list_key, set_key, blocking_key = cls.get_keys(entity_key)

        # For every rule, fetch the timestamp of its nth most recent request,
        # followed by the manual-block value and its TTL, in one round trip.
        with client.pipeline() as pipe:
            for _, request_count in rules:
                pipe.lindex(list_key, request_count - 1)  # 0-indexed list

            pipe.get(blocking_key)
            pipe.ttl(blocking_key)

            responses: list[bytes | None] = pipe.execute()

        # The last two responses are the blocking info; the rest are per-rule.
        *rule_timestamps, key_blocked, blocking_ttl_b = responses

        if key_blocked is not None:
            # We are manually blocked. Report for how much longer we will be
            if blocking_ttl_b is None:  # nocoverage # defensive code, this should never happen
                blocking_ttl = 0.5
            else:
                blocking_ttl = int(blocking_ttl_b)
            return True, blocking_ttl

        now = time.time()
        for timestamp, (range_seconds, _num_requests) in zip(rule_timestamps, rules, strict=False):
            # No nth timestamp means fewer than n requests are on record.
            if timestamp is not None:
                # If the nth timestamp still falls inside the rule's window,
                # we've hit our limit for this rule.
                boundary = float(timestamp) + range_seconds
                if boundary >= now:
                    return True, boundary - now

        return False, 0.0

    @classmethod
    def incr_ratelimit(cls, entity_key: str, max_api_calls: int, max_api_window: int) -> None:
        """Record a request made now for the specified entity.

        Raises ``RateLimiterLockingError`` if the Redis transaction keeps
        conflicting with concurrent updates.
        """
        list_key, set_key, _ = cls.get_keys(entity_key)
        now = time.time()

        # Start Redis transaction
        with client.pipeline() as pipe:
            conflicts = 0
            while True:
                try:
                    # Watching the list aborts this whole transaction if another
                    # agent changes it between our read of the element we are
                    # about to trim and its removal from the sorted set.
                    # When watching a value, the pipeline is set to Immediate mode
                    pipe.watch(list_key)

                    # The element that the trim below will drop, if any.
                    last_val = cast(  # mypy doesn't know the pipe is in immediate mode
                        bytes | None, pipe.lindex(list_key, max_api_calls - 1)
                    )

                    # Restart buffered execution
                    pipe.multi()

                    # Add this timestamp to our list, then trim the list to
                    # the size of the largest rule we have.
                    pipe.lpush(list_key, now)
                    pipe.ltrim(list_key, 0, max_api_calls - 1)

                    # The sorted set uses the timestamp as both score and
                    # value: we sort by score but remove by value.
                    pipe.zadd(set_key, {str(now): now})

                    # Remove the trimmed value from our sorted set, if there was one
                    if last_val is not None:
                        pipe.zrem(set_key, last_val)

                    # Set the TTL for our keys as well
                    pipe.expire(list_key, max_api_window)
                    pipe.expire(set_key, max_api_window)

                    pipe.execute()

                    # No exception from execute() means no transaction conflict.
                    return
                except redis.WatchError:  # nocoverage # Ideally we'd have a test for this.
                    if conflicts > 10:
                        raise RateLimiterLockingError
                    conflicts += 1

    @classmethod
    @override
    def rate_limit_entity(
        cls, entity_key: str, rules: list[tuple[int, int]], max_api_calls: int, max_api_window: int
    ) -> tuple[bool, float]:
        """Returns (ratelimited, secs_to_freedom); records the request if it is allowed."""
        ratelimited, secs_to_freedom = cls.is_ratelimited(entity_key, rules)
        if ratelimited:
            return ratelimited, secs_to_freedom

        try:
            cls.incr_ratelimit(entity_key, max_api_calls, max_api_window)
        except RateLimiterLockingError:
            logger.warning("Deadlock trying to incr_ratelimit for %s", entity_key)
            # rate-limit users who are hitting the API so hard we can't update our stats.
            return True, secs_to_freedom

        return ratelimited, secs_to_freedom


class RateLimitResult:
    """Outcome of applying one entity's rate limit to a request."""

    def __init__(
        self, entity: RateLimitedObject, secs_to_freedom: float, over_limit: bool, remaining: int
    ) -> None:
        # An entity that is over its limit cannot have any calls remaining.
        assert not (over_limit and remaining)

        self.entity, self.secs_to_freedom = entity, secs_to_freedom
        self.over_limit, self.remaining = over_limit, remaining


class RateLimitedSpectatorAttachmentAccessByFile(RateLimitedObject):
    """Rate-limit entity keyed by an attachment's ``path_id``."""

    def __init__(self, path_id: str) -> None:
        self.path_id = path_id
        # No explicit backend: the base class chooses its default.
        super().__init__()

    @override
    def key(self) -> str:
        """Return ``<class name>:<path_id>``."""
        class_name = type(self).__name__
        return f"{class_name}:{self.path_id}"

    @override
    def rules(self) -> list[tuple[int, int]]:
        """Return the rules configured for 'spectator_attachment_access_by_file'."""
        all_rules = settings.RATE_LIMITING_RULES
        return all_rules["spectator_attachment_access_by_file"]


def rate_limit_spectator_attachment_access_by_file(path_id: str) -> None:
    """Rate limit access to the attachment at ``path_id``.

    Raises ``RateLimitedError`` when the limit for that file is exceeded.
    """
    entity = RateLimitedSpectatorAttachmentAccessByFile(path_id)
    over_limit = entity.rate_limit()[0]
    if over_limit:
        raise RateLimitedError


def is_local_addr(addr: str) -> bool:
    """Return whether ``addr`` is exactly "127.0.0.1" or "::1"."""
    loopback_addrs = ("127.0.0.1", "::1")
    return addr in loopback_addrs


@cache_with_key(lambda: "tor_ip_addresses:", timeout=60 * 60)
@circuit(failure_threshold=2, recovery_timeout=60 * 10)
def get_tor_ips() -> set[str]:
    """Return the set of TOR exit node addresses read from disk.

    Returns an empty set when ``settings.RATE_LIMIT_TOR_TOGETHER`` is off.
    Raises ``OSError`` if the file cannot be opened or holds an empty list.
    """
    if not settings.RATE_LIMIT_TOR_TOGETHER:
        return set()

    # Cron job in /etc/cron.d/fetch-tor-exit-nodes fetches this
    # hourly; we cache it in memcached to prevent going to disk on
    # every unauth'd request.  In case of failures to read, we
    # circuit-break so 2 failures cause a 10-minute backoff.
    with open(settings.TOR_EXIT_NODE_FILE_PATH, "rb") as node_file:
        raw_contents = node_file.read()
    exit_nodes = orjson.loads(raw_contents)

    # An empty list means something went wrong when the file was written;
    # treat it like a missing file. Circuit-breaking ensures that we back
    # off on re-reading it.
    if len(exit_nodes) == 0:
        raise OSError("File is empty")

    return set(exit_nodes)


def client_is_exempt_from_rate_limiting(request: HttpRequest) -> bool:
    """Return whether ``request`` should bypass rate limiting.

    Only requests whose client is named "internal" qualify, and then only if
    they come from a local address or ``settings.DEBUG_RATE_LIMITING`` is set.
    """
    from zerver.lib.request import RequestNotes

    # Don't rate limit requests from Django that come from our own servers,
    # and don't rate-limit dev instances
    request_client = RequestNotes.get_notes(request).client
    if request_client is None or request_client.name.lower() != "internal":
        return False

    return is_local_addr(request.META["REMOTE_ADDR"]) or settings.DEBUG_RATE_LIMITING


def rate_limit_user(request: HttpRequest, user: UserProfile, domain: str) -> None:
    """Apply the per-user rate limit for ``domain`` to ``request``.

    Raises a RateLimitedError exception if the user has been rate limited;
    otherwise returns None after the rate limit information has been recorded
    on the request. Does nothing when the request should not be rate limited.
    """
    if should_rate_limit(request):
        RateLimitedUser(user, domain=domain).rate_limit_request(request)


def rate_limit_request_by_ip(request: HttpRequest, domain: str) -> None:
    """Apply the per-IP rate limit for ``domain`` to ``request``.

    All TOR exit nodes share a single bucket. Raises ``RateLimitedError``
    (via ``rate_limit_request``) when the address is over its limits.
    """
    if not should_rate_limit(request):
        return

    # REMOTE_ADDR is set by SetRemoteAddrFromRealIpHeader in conjunction
    # with the nginx configuration to guarantee this to be *the* correct
    # IP address to use - without worrying we'll grab the IP of a proxy.
    ip_addr = request.META["REMOTE_ADDR"]
    assert ip_addr

    try:
        # We lump all TOR exit nodes into one bucket; this prevents
        # abuse from TOR, while still allowing some access to these
        # endpoints for legitimate users.  Skipping the lookup for local
        # addresses is a shortcut somewhat for ease of testing without
        # mocking the TOR endpoint in every test.
        if not is_local_addr(ip_addr) and ip_addr in get_tor_ips():
            ip_addr = "tor-exit-node"
    except (OSError, CircuitBreakerError) as err:
        # In the event that we can't get an updated list of TOR exit
        # nodes, assume the IP is _not_ one, and leave it unchanged.
        # We log a warning so that this endpoint being taken out of
        # service doesn't silently remove this functionality.
        logger.warning("Failed to fetch TOR exit node list: %s", err)

    RateLimitedIPAddr(ip_addr, domain=domain).rate_limit_request(request)


def should_rate_limit(request: HttpRequest) -> bool:
    """Return whether rate limiting applies to ``request``.

    It applies when ``settings.RATE_LIMITING`` is on and the client is not exempt.
    """
    if not settings.RATE_LIMITING:
        return False

    return not client_is_exempt_from_rate_limiting(request)
-												python: Sort imports with isort.

Fixes #2665.

Regenerated by tabbott with `lint --fix` after a rebase and change in
parameters.

Note from tabbott: In a few cases, this converts technical debt in the
form of unsorted imports into different technical debt in the form of
our largest files having very long, ugly import sequences at the
start.  I expect this change will increase pressure for us to split
those files, which isn't a bad thing.

Signed-off-by: Anders Kaseorg <anders@zulip.com>

											
										
										
											2020-06-11 00:54:34 +02:00
+								import logging
 								import time
-												rate_limiter: Use ABC for defining the abstract class RateLimitedObject.

											
										
										
											2019-12-30 02:26:08 +01:00
+								from abc import ABC, abstractmethod
-												ruff: Fix UP006 Use `list` instead of `List` for type annotation.

Signed-off-by: Anders Kaseorg <anders@zulip.com>

											
										
										
											2024-07-12 02:30:17 +02:00
+								from typing import Optional, cast
-												Annotation of zerver/lib/rate_limiter.py

											
										
										
											2016-03-27 12:09:54 +02:00
-												rate_limiter: Extract rate limit related functions.

This refactors rate limit related functions from `zerver.decorator` to
zerver.lib.rate_limiter.

We conditionally import `RemoteZulipServer`, `RequestNotes`, and
`RateLimitedRemoteZulipServer` to avoid circular dependency.

Most instances of importing these functions from `zerver.decorator` got
updated, with a few exceptions in `zerver.tests.test_decorators`, where
we do want to mock the rate limiting functions imported in
`zerver.decorator`. The same goes with the mocking example in the
"testing-with-django" documentation.

Signed-off-by: Zixuan James Li <p359101898@gmail.com>

											
										
										
											2022-08-05 17:40:03 +02:00
+								import orjson
-												python: Sort imports with isort.

Fixes #2665.

Regenerated by tabbott with `lint --fix` after a rebase and change in
parameters.

Note from tabbott: In a few cases, this converts technical debt in the
form of unsorted imports into different technical debt in the form of
our largest files having very long, ugly import sequences at the
start.  I expect this change will increase pressure for us to split
those files, which isn't a bad thing.

Signed-off-by: Anders Kaseorg <anders@zulip.com>

											
										
										
											2020-06-11 00:54:34 +02:00
+								import redis
-												rate_limiter: Extract rate limit related functions.

This refactors rate limit related functions from `zerver.decorator` to
zerver.lib.rate_limiter.

We conditionally import `RemoteZulipServer`, `RequestNotes`, and
`RateLimitedRemoteZulipServer` to avoid circular dependency.

Most instances of importing these functions from `zerver.decorator` got
updated, with a few exceptions in `zerver.tests.test_decorators`, where
we do want to mock the rate limiting functions imported in
`zerver.decorator`. The same goes with the mocking example in the
"testing-with-django" documentation.

Signed-off-by: Zixuan James Li <p359101898@gmail.com>

											
										
										
											2022-08-05 17:40:03 +02:00
+								from circuitbreaker import CircuitBreakerError, circuit
-												Add a rate limiting system to our backend

(imported from commit a1218618918b4dedc77307e2f277665e7dd8fa22)

											
										
										
											2013-05-29 23:58:07 +02:00
+								from django.conf import settings
-												rate_limiter: Create a general rate_limit_request_by_entity function.

											
										
										
											2019-04-01 20:11:56 +02:00
+								from django.http import HttpRequest
-												mypy: Enable new error explicit-override.

Signed-off-by: Anders Kaseorg <anders@zulip.com>

											
										
										
											2023-10-12 19:43:45 +02:00
+								from typing_extensions import override
-												python: Sort imports with isort.

Fixes #2665.

Regenerated by tabbott with `lint --fix` after a rebase and change in
parameters.

Note from tabbott: In a few cases, this converts technical debt in the
form of unsorted imports into different technical debt in the form of
our largest files having very long, ugly import sequences at the
start.  I expect this change will increase pressure for us to split
those files, which isn't a bad thing.

Signed-off-by: Anders Kaseorg <anders@zulip.com>

											
										
										
											2020-06-11 00:54:34 +02:00
-												rate_limiter: Extract KEY_PREFIX to redis_utils.

											
										
										
											2024-03-19 02:46:33 +01:00
+								from zerver.lib import redis_utils
-												rate_limiter: Extract rate limit related functions.

This refactors rate limit related functions from `zerver.decorator` to
zerver.lib.rate_limiter.

We conditionally import `RemoteZulipServer`, `RequestNotes`, and
`RateLimitedRemoteZulipServer` to avoid circular dependency.

Most instances of importing these functions from `zerver.decorator` got
updated, with a few exceptions in `zerver.tests.test_decorators`, where
we do want to mock the rate limiting functions imported in
`zerver.decorator`. The same goes with the mocking example in the
"testing-with-django" documentation.

Signed-off-by: Zixuan James Li <p359101898@gmail.com>

											
										
										
											2022-08-05 17:40:03 +02:00
+								from zerver.lib.cache import cache_with_key
-												ruff: Fix N818 exception name should be named with an Error suffix.

Signed-off-by: Anders Kaseorg <anders@zulip.com>

											
										
										
											2022-11-17 09:30:48 +01:00
+								from zerver.lib.exceptions import RateLimitedError
-												Add helper function for returning a Redis client

(imported from commit 47f87d388d24343ac6b631181a55287eb8cd4a6d)

											
										
										
											2014-02-05 00:35:32 +01:00
+								from zerver.lib.redis_utils import get_redis_client
-												Annotation of zerver/lib/rate_limiter.py

											
										
										
											2016-03-27 12:09:54 +02:00
+								from zerver.models import UserProfile
-												Add a rate limiting system to our backend

(imported from commit a1218618918b4dedc77307e2f277665e7dd8fa22)

											
										
										
											2013-05-29 23:58:07 +02:00
+								# Implement a rate-limiting scheme inspired by the one described here, but heavily modified
-												docs: Convert many http URLs to https.

Signed-off-by: Anders Kaseorg <anders@zulipchat.com>

											
										
										
											2020-03-27 01:32:21 +01:00
+								# https://www.domaintools.com/resources/blog/rate-limiting-with-redis
-												Add a rate limiting system to our backend

(imported from commit a1218618918b4dedc77307e2f277665e7dd8fa22)

											
										
										
											2013-05-29 23:58:07 +02:00
-												Add helper function for returning a Redis client

(imported from commit 47f87d388d24343ac6b631181a55287eb8cd4a6d)

											
										
										
											2014-02-05 00:35:32 +01:00
+								client = get_redis_client()
-												ruff: Fix UP006 Use `list` instead of `List` for type annotation.

Signed-off-by: Anders Kaseorg <anders@zulip.com>

											
										
										
											2024-07-12 02:30:17 +02:00
+								rules: dict[str, list[tuple[int, int]]] = settings.RATE_LIMITING_RULES
-												Add a rate limiting system to our backend

(imported from commit a1218618918b4dedc77307e2f277665e7dd8fa22)

											
										
										
											2013-05-29 23:58:07 +02:00
-												rate_limiter: Generalise some rate_limit_user code.

We create rate_limit_entity as a general rate-limiting function for
RateLimitedObjects, from code that was possible to abstract away from
rate_limit_user and that will be used for other kinds of rate limiting.
We make rate_limit_user use this new general framework from now.

											
										
										
											2019-03-23 18:33:37 +01:00
+								logger = logging.getLogger(__name__)
-												python: Reformat with Black, except quotes.

Signed-off-by: Anders Kaseorg <anders@zulip.com>

											
										
										
											2021-02-12 08:19:30 +01:00
-												ruff: Fix N818 exception name should be named with an Error suffix.

Signed-off-by: Anders Kaseorg <anders@zulip.com>

											
										
										
											2022-11-17 09:30:48 +01:00
+								class RateLimiterLockingError(Exception):
-												rate_limiter: Improve handling of deadlocks.

We should rate-limit users when our rate limiter deadlocks trying to
increment its count; we also now log at warning level (so it doesn't
send spammy emails) and include details on the user and route was, so
that we can properly investigate whether the rate-limiting on the
route was in error.

											
										
										
											2018-12-12 21:13:00 +01:00
+								    pass
-												python: Reformat with Black, except quotes.

Signed-off-by: Anders Kaseorg <anders@zulip.com>

											
										
										
											2021-02-12 08:19:30 +01:00
-												rate_limiter: Use ABC for defining the abstract class RateLimitedObject.

											
										
										
											2019-12-30 02:26:08 +01:00
+								class RateLimitedObject(ABC):
-												ruff: Fix UP006 Use `list` instead of `List` for type annotation.

Signed-off-by: Anders Kaseorg <anders@zulip.com>

											
										
										
											2024-07-12 02:30:17 +02:00
+								    def __init__(self, backend: Optional["type[RateLimiterBackend]"] = None) -> None:
-												rate_limiter: Add more detailed automated tests.

Extracted by tabbott from the original commit to support testing
without the Tornado version merged yet.

											
										
										
											2020-04-02 20:40:10 +02:00
+								        if backend is not None:
-												ruff: Fix UP006 Use `list` instead of `List` for type annotation.

Signed-off-by: Anders Kaseorg <anders@zulip.com>

											
										
										
											2024-07-12 02:30:17 +02:00
+								            self.backend: type[RateLimiterBackend] = backend
-												rate_limiter: Add more detailed automated tests.

Extracted by tabbott from the original commit to support testing
without the Tornado version merged yet.

											
										
										
											2020-04-02 20:40:10 +02:00
+								        else:
 								            self.backend = RedisRateLimiterBackend
-												rate_limit: Add the concept of RateLimiterBackend.

This will allow easily swapping and using various implementations of
rate-limiting, and separate the implementation logic from
RateLimitedObjects.

											
										
										
											2020-03-05 13:38:20 +01:00
-												ruff: Fix UP006 Use `list` instead of `List` for type annotation.

Signed-off-by: Anders Kaseorg <anders@zulip.com>

											
										
										
											2024-07-12 02:30:17 +02:00
+								    def rate_limit(self) -> tuple[bool, float]:
-												rate_limit: Move functions called by external code to RateLimitedObject.

											
										
										
											2020-03-04 14:05:25 +01:00
+								        # Returns (ratelimited, secs_to_freedom)
-												python: Reformat with Black, except quotes.

Signed-off-by: Anders Kaseorg <anders@zulip.com>

											
										
										
											2021-02-12 08:19:30 +01:00
+								        return self.backend.rate_limit_entity(
 								            self.key(), self.get_rules(), self.max_api_calls(), self.max_api_window()
 								        )
-												rate_limit: Move functions called by external code to RateLimitedObject.

											
										
										
											2020-03-04 14:05:25 +01:00
 								    def rate_limit_request(self, request: HttpRequest) -> None:
-												request: Refactor ZulipRequestNotes to RequestNotes.

This utilizes the generic `BaseNotes` we added for multipurpose
patching. With this migration as an example, we can further support
more types of notes to replace the monkey-patching approach we have used
throughout the codebase for type safety.

											
										
										
											2021-08-21 19:24:20 +02:00
+								        from zerver.lib.request import RequestNotes
-												Revert "Revert "request: Refactor to record rate limit data using ZulipRequestNotes.""

This reverts commit 49eab4efef8d9e1561f926f1e4db47e66d5e6807.

Signed-off-by: Anders Kaseorg <anders@zulip.com>

											
										
										
											2021-07-19 23:27:29 +02:00
-												rate_limit: Move functions called by external code to RateLimitedObject.

											
										
										
											2020-03-04 14:05:25 +01:00
+								        ratelimited, time = self.rate_limit()
-												request: Refactor ZulipRequestNotes to RequestNotes.

This utilizes the generic `BaseNotes` we added for multipurpose
patching. With this migration as an example, we can further support
more types of notes to replace the monkey-patching approach we have used
throughout the codebase for type safety.

											
										
										
											2021-08-21 19:24:20 +02:00
+								        request_notes = RequestNotes.get_notes(request)
-												rate_limit: Move functions called by external code to RateLimitedObject.

											
										
										
											2020-03-04 14:05:25 +01:00
-												Revert "Revert "request: Refactor to record rate limit data using ZulipRequestNotes.""

This reverts commit 49eab4efef8d9e1561f926f1e4db47e66d5e6807.

Signed-off-by: Anders Kaseorg <anders@zulip.com>

											
										
										
											2021-07-19 23:27:29 +02:00
+								        request_notes.ratelimits_applied.append(
-												python: Reformat with Black, except quotes.

Signed-off-by: Anders Kaseorg <anders@zulip.com>

											
										
										
											2021-02-12 08:19:30 +01:00
+								            RateLimitResult(
 								                entity=self,
 								                secs_to_freedom=time,
 								                remaining=0,
 								                over_limit=ratelimited,
 								            )
 								        )
-												rate_limit: Move functions called by external code to RateLimitedObject.

											
										
										
											2020-03-04 14:05:25 +01:00
+								        # Abort this request if the user is over their rate limits
 								        if ratelimited:
 								            # Pass information about what kind of entity got limited in the exception:
-												ruff: Fix N818 exception name should be named with an Error suffix.

Signed-off-by: Anders Kaseorg <anders@zulip.com>

											
										
										
											2022-11-17 09:30:48 +01:00
+								            raise RateLimitedError(time)
-												rate_limit: Move functions called by external code to RateLimitedObject.

											
										
										
											2020-03-04 14:05:25 +01:00
-												rate_limiter: Fix secs_to_freedom being set to a timestamp.

time_reset returned from api_calls_left() was a timestamp, but
mistakenly treated as delta seconds. We change the return value of
api_calls_left() to be delta seconds, to be consistent with the return
value of rate_limit().

											
										
										
											2020-04-01 18:44:19 +02:00
+								        calls_remaining, seconds_until_reset = self.api_calls_left()
-												rate_limit: Move functions called by external code to RateLimitedObject.

											
										
										
											2020-03-04 14:05:25 +01:00
-												Revert "Revert "request: Refactor to record rate limit data using ZulipRequestNotes.""

This reverts commit 49eab4efef8d9e1561f926f1e4db47e66d5e6807.

Signed-off-by: Anders Kaseorg <anders@zulip.com>

											
										
										
											2021-07-19 23:27:29 +02:00
+								        request_notes.ratelimits_applied[-1].remaining = calls_remaining
 								        request_notes.ratelimits_applied[-1].secs_to_freedom = seconds_until_reset
-												rate_limit: Move functions called by external code to RateLimitedObject.

											
										
										
											2020-03-04 14:05:25 +01:00
 								    def block_access(self, seconds: int) -> None:
-												ruff: Fix Q002 Single quote docstring found.

Signed-off-by: Anders Kaseorg <anders@zulip.com>

											
										
										
											2022-12-14 10:46:29 +01:00
+								        """Manually blocks an entity for the desired number of seconds"""
-												rate_limit: Refactor RateLimiterBackend to operate on keys and rules.

Instead of operating on RateLimitedObjects, and making the classes
depend on each other too strongly. This also allows getting rid of get_keys()
function from RateLimitedObject, which was a redis rate limiter
implementation detail. RateLimitedObject should only define their own
key() function and the logic forming various necessary redis keys from
them should be in RedisRateLimiterBackend.

											
										
										
											2020-03-06 13:44:52 +01:00
+								        self.backend.block_access(self.key(), seconds)
-												rate_limit: Move functions called by external code to RateLimitedObject.

											
										
										
											2020-03-04 14:05:25 +01:00
 								    def unblock_access(self) -> None:
-												rate_limit: Refactor RateLimiterBackend to operate on keys and rules.

Instead of operating on RateLimitedObjects, and making the classes
depend on each other too strongly. This also allows getting rid of get_keys()
function from RateLimitedObject, which was a redis rate limiter
implementation detail. RateLimitedObject should only define their own
key() function and the logic forming various necessary redis keys from
them should be in RedisRateLimiterBackend.

											
										
										
											2020-03-06 13:44:52 +01:00
+								        self.backend.unblock_access(self.key())
-												rate_limit: Move functions called by external code to RateLimitedObject.

											
										
										
											2020-03-04 14:05:25 +01:00
 								    def clear_history(self) -> None:
-												rate_limit: Refactor RateLimiterBackend to operate on keys and rules.

Instead of operating on RateLimitedObjects, and making the classes
depend on each other too strongly. This also allows getting rid of get_keys()
function from RateLimitedObject, which was a redis rate limiter
implementation detail. RateLimitedObject should only define their own
key() function and the logic forming various necessary redis keys from
them should be in RedisRateLimiterBackend.

											
										
										
											2020-03-06 13:44:52 +01:00
+								        self.backend.clear_history(self.key())
-												rate_limit: Move functions called by external code to RateLimitedObject.

											
										
										
											2020-03-04 14:05:25 +01:00
 								    def max_api_calls(self) -> int:
-												ruff: Fix Q002 Single quote docstring found.

Signed-off-by: Anders Kaseorg <anders@zulip.com>

											
										
										
											2022-12-14 10:46:29 +01:00
+								        """Returns the API rate limit for the highest limit"""
-												rate_limiter: Handle edge case where rules list may be empty.

											
										
										
											2020-04-02 22:23:20 +02:00
+								        return self.get_rules()[-1][1]
-												rate_limit: Move functions called by external code to RateLimitedObject.

											
										
										
											2020-03-04 14:05:25 +01:00
 								    def max_api_window(self) -> int:
-												ruff: Fix Q002 Single quote docstring found.

Signed-off-by: Anders Kaseorg <anders@zulip.com>

											
										
										
											2022-12-14 10:46:29 +01:00
+								        """Returns the API time window for the highest limit"""
-												rate_limiter: Handle edge case where rules list may be empty.

											
										
										
											2020-04-02 22:23:20 +02:00
+								        return self.get_rules()[-1][0]
-												rate_limit: Move functions called by external code to RateLimitedObject.

											
										
										
											2020-03-04 14:05:25 +01:00
-												ruff: Fix UP006 Use `list` instead of `List` for type annotation.

Signed-off-by: Anders Kaseorg <anders@zulip.com>

											
										
										
											2024-07-12 02:30:17 +02:00
+								    def api_calls_left(self) -> tuple[int, float]:
-												rate_limit: Move functions called by external code to RateLimitedObject.

											
										
										
											2020-03-04 14:05:25 +01:00
+								        """Returns how many API calls in this range this client has, as well as when
 								        the rate-limit will be reset to 0"""
 								        max_window = self.max_api_window()
 								        max_calls = self.max_api_calls()
-												rate_limit: Refactor RateLimiterBackend to operate on keys and rules.

Instead of operating on RateLimitedObjects, and making the classes
depend on each other too strongly. This also allows getting rid of get_keys()
function from RateLimitedObject, which was a redis rate limiter
implementation detail. RateLimitedObject should only define their own
key() function and the logic forming various necessary redis keys from
them should be in RedisRateLimiterBackend.

											
										
										
											2020-03-06 13:44:52 +01:00
+								        return self.backend.get_api_calls_left(self.key(), max_window, max_calls)
-												rate_limit: Move functions called by external code to RateLimitedObject.

											
										
										
											2020-03-04 14:05:25 +01:00
-												ruff: Fix UP006 Use `list` instead of `List` for type annotation.

Signed-off-by: Anders Kaseorg <anders@zulip.com>

											
										
										
											2024-07-12 02:30:17 +02:00
+								    def get_rules(self) -> list[tuple[int, int]]:
-												rate_limiter: Handle edge case where rules list may be empty.

											
										
										
											2020-04-02 22:23:20 +02:00
+								        """
 								        This is a simple wrapper meant to protect against having to deal with
 								        an empty list of rules, as it would require fiddling with that special case
 								        all around this system. "9999 max request per seconds" should be a good proxy
 								        for "no rules".
 								        """
 								        rules_list = self.rules()
-												python: Use trailing commas consistently.

Automatically generated by the following script, based on the output
of lint with flake8-comma:

import re
import sys

last_filename = None
last_row = None
lines = []

for msg in sys.stdin:
    m = re.match(
        r"\x1b\[35mflake8    \|\x1b\[0m \x1b\[1;31m(.+):(\d+):(\d+): (\w+)", msg
    )
    if m:
        filename, row_str, col_str, err = m.groups()
        row, col = int(row_str), int(col_str)

        if filename == last_filename:
            assert last_row != row
        else:
            if last_filename is not None:
                with open(last_filename, "w") as f:
                    f.writelines(lines)

            with open(filename) as f:
                lines = f.readlines()
            last_filename = filename
        last_row = row

        line = lines[row - 1]
        if err in ["C812", "C815"]:
            lines[row - 1] = line[: col - 1] + "," + line[col - 1 :]
        elif err in ["C819"]:
            assert line[col - 2] == ","
            lines[row - 1] = line[: col - 2] + line[col - 1 :].lstrip(" ")

if last_filename is not None:
    with open(last_filename, "w") as f:
        f.writelines(lines)

Signed-off-by: Anders Kaseorg <anders@zulipchat.com>

											
										
										
											2020-04-10 05:23:40 +02:00
+								        return rules_list or [(1, 9999)]
-												rate_limiter: Handle edge case where rules list may be empty.

											
										
										
											2020-04-02 22:23:20 +02:00
-												rate_limiter: Use ABC for defining the abstract class RateLimitedObject.

											
										
										
											2019-12-30 02:26:08 +01:00
+								    @abstractmethod
-												rate_limit: Rename key_fragment() method to key().

											
										
										
											2020-03-06 10:49:04 +01:00
+								    def key(self) -> str:
-												rate_limiter: Use ABC for defining the abstract class RateLimitedObject.

											
										
										
											2019-12-30 02:26:08 +01:00
+								        pass
-												rate_limiter: Use RateLimitedUser class.

This commit lays groundwork for transitioning to using RateLimited
class in our rate limiter API.

											
										
										
											2017-07-28 06:40:52 +02:00
-												rate_limiter: Use ABC for defining the abstract class RateLimitedObject.

											
										
										
											2019-12-30 02:26:08 +01:00
+								    @abstractmethod
-												ruff: Fix UP006 Use `list` instead of `List` for type annotation.

Signed-off-by: Anders Kaseorg <anders@zulip.com>

											
										
										
											2024-07-12 02:30:17 +02:00
+								    def rules(self) -> list[tuple[int, int]]:
-												rate_limiter: Use ABC for defining the abstract class RateLimitedObject.

											
										
										
											2019-12-30 02:26:08 +01:00
+								        pass
-												rate_limiter: Use RateLimitedUser class.

This commit lays groundwork for transitioning to using RateLimited
class in our rate limiter API.

											
										
										
											2017-07-28 06:40:52 +02:00
-												python: Reformat with Black, except quotes.

Signed-off-by: Anders Kaseorg <anders@zulip.com>

											
										
										
											2021-02-12 08:19:30 +01:00
-												rate_limiter: Use RateLimitedUser class.

This commit lays groundwork for transitioning to using RateLimited
class in our rate limiter API.

											
										
										
											2017-07-28 06:40:52 +02:00
+								class RateLimitedUser(RateLimitedObject):
-												python: Normalize quotes with Black.

Signed-off-by: Anders Kaseorg <anders@zulip.com>

											
										
										
											2021-02-12 08:20:45 +01:00
+								    def __init__(self, user: UserProfile, domain: str = "api_by_user") -> None:
-												rate_limiter: Avoid strong reference to user.

This prevents a memory leak caused by the `SimpleLazyObject` instance of
`UserProfile` that creates a reference loop with the request object
via `ZulipRequestNotes`.

											
										
										
											2021-07-20 07:26:36 +02:00
+								        self.user_id = user.id
 								        self.rate_limits = user.rate_limits
-												rate_limiter: Use RateLimitedUser class.

This commit lays groundwork for transitioning to using RateLimited
class in our rate limiter API.

											
										
										
											2017-07-28 06:40:52 +02:00
+								        self.domain = domain
-												rate_limit: Restrict tornado backend to explicitly specified domains.

This will protect us in case of some kinds of bugs that could allow
making requests such as password authentication attempts to tornado.
Without restricting the domains to which the in-memory backend can
be applied, such bugs would lead to attackers having multiple times
larger rate limits for these sensitive requests.

											
										
										
											2020-05-25 21:50:07 +02:00
+								        if settings.RUNNING_INSIDE_TORNADO and domain in settings.RATE_LIMITING_DOMAINS_FOR_TORNADO:
-												ruff: Fix UP007 Use `X | Y` for type annotations.

Signed-off-by: Anders Kaseorg <anders@zulip.com>

											
										
										
											2024-07-12 02:30:23 +02:00
+								            backend: type[RateLimiterBackend] | None = TornadoInMemoryRateLimiterBackend
-												rate_limit: Restrict tornado backend to explicitly specified domains.

This will protect us in case of some kinds of bugs that could allow
making requests such as password authentication attempts to tornado.
Without restricting the domains to which the in-memory backend can
be applied, such bugs would lead to attackers having multiple times
larger rate limits for these sensitive requests.

											
										
										
											2020-05-25 21:50:07 +02:00
+								        else:
 								            backend = None
 								        super().__init__(backend=backend)
-												rate_limiter: Use RateLimitedUser class.

This commit lays groundwork for transitioning to using RateLimited
class in our rate limiter API.

											
										
										
											2017-07-28 06:40:52 +02:00
-												mypy: Enable new error explicit-override.

Signed-off-by: Anders Kaseorg <anders@zulip.com>

											
										
										
											2023-10-12 19:43:45 +02:00
+								    @override
-												rate_limit: Rename key_fragment() method to key().

											
										
										
											2020-03-06 10:49:04 +01:00
+								    def key(self) -> str:
-												rate_limiter: Avoid strong reference to user.

This prevents a memory leak caused by the `SimpleLazyObject` instance of
`UserProfile` that creates a reference loop with the request object
via `ZulipRequestNotes`.

											
										
										
											2021-07-20 07:26:36 +02:00
+								        return f"{type(self).__name__}:{self.user_id}:{self.domain}"
-												rate_limiter: Use RateLimitedUser class.

This commit lays groundwork for transitioning to using RateLimited
class in our rate limiter API.

											
										
										
											2017-07-28 06:40:52 +02:00
-												mypy: Enable new error explicit-override.

Signed-off-by: Anders Kaseorg <anders@zulip.com>

											
										
										
											2023-10-12 19:43:45 +02:00
+								    @override
-												ruff: Fix UP006 Use `list` instead of `List` for type annotation.

Signed-off-by: Anders Kaseorg <anders@zulip.com>

											
										
										
											2024-07-12 02:30:17 +02:00
+								    def rules(self) -> list[tuple[int, int]]:
-												rate_limiter: Rename 'all' domain to 'api_by_user'.

											
										
										
											2019-08-03 20:39:49 +02:00
+								        # user.rate_limits are general limits, applicable to the domain 'api_by_user'
-												rate_limiter: Avoid strong reference to user.

This prevents a memory leak caused by the `SimpleLazyObject` instance of
`UserProfile` that creates a reference loop with the request object
via `ZulipRequestNotes`.

											
										
										
											2021-07-20 07:26:36 +02:00
+								        if self.rate_limits != "" and self.domain == "api_by_user":
-												ruff: Fix UP006 Use `list` instead of `List` for type annotation.

Signed-off-by: Anders Kaseorg <anders@zulip.com>

											
										
										
											2024-07-12 02:30:17 +02:00
+								            result: list[tuple[int, int]] = []
-												rate_limiter: Avoid strong reference to user.

This prevents a memory leak caused by the `SimpleLazyObject` instance of
`UserProfile` that creates a reference loop with the request object
via `ZulipRequestNotes`.

											
										
										
											2021-07-20 07:26:36 +02:00
+								            for limit in self.rate_limits.split(","):
-												python: Normalize quotes with Black.

Signed-off-by: Anders Kaseorg <anders@zulip.com>

											
										
										
											2021-02-12 08:20:45 +01:00
+								                (seconds, requests) = limit.split(":", 2)
-												rate_limiter: Use RateLimitedUser class.

This commit lays groundwork for transitioning to using RateLimited
class in our rate limiter API.

											
										
										
											2017-07-28 06:40:52 +02:00
+								                result.append((int(seconds), int(requests)))
 								            return result
-												rate_limiter: Expand support for different domains.

											
										
										
											2019-04-01 21:18:26 +02:00
+								        return rules[self.domain]
-												rate_limiter: Use RateLimitedUser class.

This commit lays groundwork for transitioning to using RateLimited
class in our rate limiter API.

											
										
										
											2017-07-28 06:40:52 +02:00
-												python: Reformat with Black, except quotes.

Signed-off-by: Anders Kaseorg <anders@zulip.com>

											
										
										
											2021-02-12 08:19:30 +01:00
-												rate_limit: Implement IP-based rate limiting.

If the user is logged in, we'll stick to rate limiting by the
UserProfile. In case of requests without authentication, we'll apply the
same limits but to the IP address.

											
										
										
											2021-07-08 14:46:47 +02:00
+								class RateLimitedIPAddr(RateLimitedObject):
 								    def __init__(self, ip_addr: str, domain: str = "api_by_ip") -> None:
 								        self.ip_addr = ip_addr
 								        self.domain = domain
 								        if settings.RUNNING_INSIDE_TORNADO and domain in settings.RATE_LIMITING_DOMAINS_FOR_TORNADO:
-												ruff: Fix UP007 Use `X | Y` for type annotations.

Signed-off-by: Anders Kaseorg <anders@zulip.com>

											
										
										
											2024-07-12 02:30:23 +02:00
+								            backend: type[RateLimiterBackend] | None = TornadoInMemoryRateLimiterBackend
-												rate_limit: Implement IP-based rate limiting.

If the user is logged in, we'll stick to rate limiting by the
UserProfile. In case of requests without authentication, we'll apply the
same limits but to the IP address.

											
										
										
											2021-07-08 14:46:47 +02:00
+								        else:
 								            backend = None
 								        super().__init__(backend=backend)
-												mypy: Enable new error explicit-override.

Signed-off-by: Anders Kaseorg <anders@zulip.com>

											
										
										
											2023-10-12 19:43:45 +02:00
+								    @override
-												rate_limit: Implement IP-based rate limiting.

If the user is logged in, we'll stick to rate limiting by the
UserProfile. In case of requests without authentication, we'll apply the
same limits but to the IP address.

											
										
										
											2021-07-08 14:46:47 +02:00
+								    def key(self) -> str:
 								        # The angle brackets are important since IPv6 addresses contain :.
 								        return f"{type(self).__name__}:<{self.ip_addr}>:{self.domain}"
-												mypy: Enable new error explicit-override.

Signed-off-by: Anders Kaseorg <anders@zulip.com>

											
										
										
											2023-10-12 19:43:45 +02:00
+								    @override
-												ruff: Fix UP006 Use `list` instead of `List` for type annotation.

Signed-off-by: Anders Kaseorg <anders@zulip.com>

											
										
										
											2024-07-12 02:30:17 +02:00
+								    def rules(self) -> list[tuple[int, int]]:
-												rate_limit: Implement IP-based rate limiting.

If the user is logged in, we'll stick to rate limiting by the
UserProfile. In case of requests without authentication, we'll apply the
same limits but to the IP address.

											
										
										
											2021-07-08 14:46:47 +02:00
+								        return rules[self.domain]
-												rate_limit: Add the concept of RateLimiterBackend.

This will allow easily swapping and using various implementations of
rate-limiting, and separate the implementation logic from
RateLimitedObjects.

											
										
										
											2020-03-05 13:38:20 +01:00
+								class RateLimiterBackend(ABC):
 								    @classmethod
 								    @abstractmethod
-												rate_limit: Refactor RateLimiterBackend to operate on keys and rules.

Instead of operating on RateLimitedObjects, and making the classes
depend on each other too strongly. This also allows getting rid of get_keys()
function from RateLimitedObject, which was a redis rate limiter
implementation detail. RateLimitedObject should only define their own
key() function and the logic forming various necessary redis keys from
them should be in RedisRateLimiterBackend.

											
										
										
											2020-03-06 13:44:52 +01:00
+								    def block_access(cls, entity_key: str, seconds: int) -> None:
-												ruff: Fix Q002 Single quote docstring found.

Signed-off-by: Anders Kaseorg <anders@zulip.com>

											
										
										
											2022-12-14 10:46:29 +01:00
+								        """Manually blocks an entity for the desired number of seconds"""
-												rate_limit: Add the concept of RateLimiterBackend.

This will allow easily swapping and using various implementations of
rate-limiting, and separate the implementation logic from
RateLimitedObjects.

											
										
										
											2020-03-05 13:38:20 +01:00
 								    @classmethod
 								    @abstractmethod
-												rate_limit: Refactor RateLimiterBackend to operate on keys and rules.

Instead of operating on RateLimitedObjects, and making the classes
depend on each other too strongly. This also allows getting rid of get_keys()
function from RateLimitedObject, which was a redis rate limiter
implementation detail. RateLimitedObject should only define their own
key() function and the logic forming various necessary redis keys from
them should be in RedisRateLimiterBackend.

											
										
										
											2020-03-06 13:44:52 +01:00
+								    def unblock_access(cls, entity_key: str) -> None:
-												rate_limit: Add the concept of RateLimiterBackend.

This will allow easily swapping and using various implementations of
rate-limiting, and separate the implementation logic from
RateLimitedObjects.

											
										
										
											2020-03-05 13:38:20 +01:00
+								        pass
 								    @classmethod
 								    @abstractmethod
-												rate_limit: Refactor RateLimiterBackend to operate on keys and rules.

Instead of operating on RateLimitedObjects, and making the classes
depend on each other too strongly. This also allows getting rid of get_keys()
function from RateLimitedObject, which was a redis rate limiter
implementation detail. RateLimitedObject should only define their own
key() function and the logic forming various necessary redis keys from
them should be in RedisRateLimiterBackend.

											
										
										
											2020-03-06 13:44:52 +01:00
+								    def clear_history(cls, entity_key: str) -> None:
-												rate_limit: Remove inaccurate docstring on clear_history methods.

											
										
										
											2020-03-06 13:58:23 +01:00
+								        pass
-												rate_limit: Add the concept of RateLimiterBackend.

This will allow easily swapping and using various implementations of
rate-limiting, and separate the implementation logic from
RateLimitedObjects.

											
										
										
											2020-03-05 13:38:20 +01:00
 								    @classmethod
 								    @abstractmethod
-												python: Reformat with Black, except quotes.

Signed-off-by: Anders Kaseorg <anders@zulip.com>

											
										
										
											2021-02-12 08:19:30 +01:00
+								    def get_api_calls_left(
 								        cls, entity_key: str, range_seconds: int, max_calls: int
-												ruff: Fix UP006 Use `list` instead of `List` for type annotation.

Signed-off-by: Anders Kaseorg <anders@zulip.com>

											
										
										
											2024-07-12 02:30:17 +02:00
+								    ) -> tuple[int, float]:
-												rate_limit: Add the concept of RateLimiterBackend.

This will allow easily swapping and using various implementations of
rate-limiting, and separate the implementation logic from
RateLimitedObjects.

											
										
										
											2020-03-05 13:38:20 +01:00
+								        pass
 								    @classmethod
 								    @abstractmethod
-												python: Reformat with Black, except quotes.

Signed-off-by: Anders Kaseorg <anders@zulip.com>

											
										
										
											2021-02-12 08:19:30 +01:00
+								    def rate_limit_entity(
-												ruff: Fix UP006 Use `list` instead of `List` for type annotation.

Signed-off-by: Anders Kaseorg <anders@zulip.com>

											
										
										
											2024-07-12 02:30:17 +02:00
+								        cls, entity_key: str, rules: list[tuple[int, int]], max_api_calls: int, max_api_window: int
 								    ) -> tuple[bool, float]:
-												rate_limit: Add the concept of RateLimiterBackend.

This will allow easily swapping and using various implementations of
rate-limiting, and separate the implementation logic from
RateLimitedObjects.

											
										
										
											2020-03-05 13:38:20 +01:00
+								        # Returns (ratelimited, secs_to_freedom)
 								        pass
-												python: Reformat with Black, except quotes.

Signed-off-by: Anders Kaseorg <anders@zulip.com>

											
										
										
											2021-02-12 08:19:30 +01:00
-												rate_limiter: Add an in-process implementation for Tornado.

The Redis-based rate limiting approach takes a lot of time talking to
Redis with 3-4 network requests to Redis on each request.  It had a
negative impact on the performance of `get_events()` since this is our
single highest-traffic endpoint.

This commit introduces an in-process rate limiting alternate for
`/json/events` endpoint. The implementation uses Leaky Bucket
algorithm and Python dictionaries instead of Redis. This drops the
rate limiting time for `get_events()` from about 3000us to less than
100us (on my system).

Fixes #13913.

Co-Author-by: Mateusz Mandera <mateusz.mandera@protonmail.com>
Co-Author-by: Anders Kaseorg <anders@zulipchat.com>

											
										
										
											2020-03-19 16:10:31 +01:00
class TornadoInMemoryRateLimiterBackend(RateLimiterBackend):
    """Rate limiter backend that keeps its state in class-level dictionaries.

    All state lives on the class itself, so it is shared by every caller
    in the current process and is not shared between processes.
    """

    # reset_times[rule][key] is the time at which the event
    # request from the rate-limited key will be accepted.
    reset_times: dict[tuple[int, int], dict[str, float]] = {}

    # last_gc_time is the last time when the garbage was
    # collected from reset_times for rule (time_window, max_count).
    last_gc_time: dict[tuple[int, int], float] = {}

    # timestamps_blocked_until[key] contains the timestamp
    # up to which the key has been blocked manually.
    timestamps_blocked_until: dict[str, float] = {}

    @classmethod
    def _garbage_collect_for_rule(cls, now: float, time_window: int, max_count: int) -> None:
        """Drop every reset time stored for the rule that is earlier than `now`.

        If that leaves the rule without any entries, the rule's dictionary
        is removed from `reset_times` as well.
        """
        rule = (time_window, max_count)
        reset_times_for_rule = cls.reset_times.get(rule)
        if reset_times_for_rule is None:
            return

        # Collect first and delete afterwards: a dict must not change
        # size while it is being iterated.
        expired_keys = [
            entity_key
            for entity_key, reset_time in reset_times_for_rule.items()
            if reset_time < now
        ]
        for entity_key in expired_keys:
            del reset_times_for_rule[entity_key]

        if not reset_times_for_rule:
            del cls.reset_times[rule]

    @classmethod
    def need_to_limit(cls, entity_key: str, time_window: int, max_count: int) -> tuple[bool, float]:
        """
        Returns a tuple of `(rate_limited, time_till_free)`.

        For simplicity, we have loosened the semantics here from
        - each key may make at most `count * (t / window)` requests within
          any t time interval.
        to
        - each key may make at most `count * [(t / window) + 1]` requests
          within any t time interval.
        Thus, we only need to store reset_times for each key which will be less
        memory-intensive. This also has the advantage that you can only ever
        lock yourself out completely for `window / count` seconds instead of
        `window` seconds.

        When the request is accepted, the stored reset time for the key is
        advanced by `time_window / max_count`; when it is rejected, the
        stored state is left unchanged.
        """
        now = time.time()
        rule = (time_window, max_count)
        seconds_per_call = time_window / max_count

        # Remove all timestamps from `reset_times` that are too old.
        if cls.last_gc_time.get(rule, 0) <= now - seconds_per_call:
            cls.last_gc_time[rule] = now
            cls._garbage_collect_for_rule(now, time_window, max_count)

        reset_times_for_rule = cls.reset_times.setdefault(rule, {})
        # A missing or already-elapsed reset time counts as "now".
        new_reset = max(reset_times_for_rule.get(entity_key, now), now) + seconds_per_call

        if new_reset > now + time_window:
            # Compute for how long the bucket will remain filled.
            time_till_free = new_reset - time_window - now
            return True, time_till_free

        reset_times_for_rule[entity_key] = new_reset
        return False, 0.0

    @classmethod
    @override
    def get_api_calls_left(
        cls, entity_key: str, range_seconds: int, max_calls: int
    ) -> tuple[int, float]:
        """Return `(calls_remaining, seconds_until_reset)` for one rule.

        A key with no stored reset time, or whose stored reset time has
        already elapsed (garbage collection only runs from
        `need_to_limit`), has its full quota: `(max_calls, 0.0)`. This
        keeps the result within `0..max_calls` and the time non-negative.
        """
        now = time.time()
        reset_time = cls.reset_times.get((range_seconds, max_calls), {}).get(entity_key)
        if reset_time is None or reset_time <= now:
            return max_calls, 0.0

        calls_remaining = (now + range_seconds - reset_time) * max_calls // range_seconds
        return int(calls_remaining), reset_time - now

    @classmethod
    @override
    def block_access(cls, entity_key: str, seconds: int) -> None:
        """Manually block `entity_key` until `seconds` from now."""
        cls.timestamps_blocked_until[entity_key] = time.time() + seconds

    @classmethod
    @override
    def unblock_access(cls, entity_key: str) -> None:
        """Remove a manual block for `entity_key`.

        Unblocking a key that is not currently blocked is a no-op rather
        than a KeyError.
        """
        cls.timestamps_blocked_until.pop(entity_key, None)

    @classmethod
    @override
    def clear_history(cls, entity_key: str) -> None:
        """Forget the reset times (for every rule) and any manual block
        stored for `entity_key`."""
        for reset_times_for_rule in cls.reset_times.values():
            reset_times_for_rule.pop(entity_key, None)
        cls.timestamps_blocked_until.pop(entity_key, None)

    @classmethod
    @override
    def rate_limit_entity(
        cls, entity_key: str, rules: list[tuple[int, int]], max_api_calls: int, max_api_window: int
    ) -> tuple[bool, float]:
        """Return `(ratelimited, secs_to_freedom)` for a request from `entity_key`.

        A manual block that is still in effect wins over the rules.
        Otherwise the rules are checked in order, stopping at the first
        one that limits the request; rules that accepted the request
        before that point have already had their reset time advanced.
        `rules` must be non-empty. `max_api_calls` and `max_api_window`
        are not used by this backend.
        """
        now = time.time()
        blocked_until = cls.timestamps_blocked_until.get(entity_key)
        if blocked_until is not None:
            # Check whether the key is manually blocked.
            if now < blocked_until:
                return True, blocked_until - now
            # The manual block has expired; forget it.
            del cls.timestamps_blocked_until[entity_key]

        assert rules
        for time_window, max_count in rules:
            ratelimited, time_till_free = cls.need_to_limit(entity_key, time_window, max_count)

            if ratelimited:
                break

        return ratelimited, time_till_free
-												python: Reformat with Black, except quotes.

Signed-off-by: Anders Kaseorg <anders@zulip.com>

											
										
										
											2021-02-12 08:19:30 +01:00
-												rate_limit: Add the concept of RateLimiterBackend.

This will allow easily swapping and using various implementations of
rate-limiting, and separate the implementation logic from
RateLimitedObjects.

											
										
										
											2020-03-05 13:38:20 +01:00
+								class RedisRateLimiterBackend(RateLimiterBackend):
 								    @classmethod
-												ruff: Fix UP006 Use `list` instead of `List` for type annotation.

Signed-off-by: Anders Kaseorg <anders@zulip.com>

											
										
										
											2024-07-12 02:30:17 +02:00
+								    def get_keys(cls, entity_key: str) -> list[str]:
-												python: Reformat with Black, except quotes.

Signed-off-by: Anders Kaseorg <anders@zulip.com>

											
										
										
											2021-02-12 08:19:30 +01:00
+								        return [
-												rate_limiter: Extract KEY_PREFIX to redis_utils.

											
										
										
											2024-03-19 02:46:33 +01:00
+								            f"{redis_utils.REDIS_KEY_PREFIX}ratelimit:{entity_key}:{keytype}"
 								            for keytype in ["list", "zset", "block"]
-												python: Reformat with Black, except quotes.

Signed-off-by: Anders Kaseorg <anders@zulip.com>

											
										
										
											2021-02-12 08:19:30 +01:00
+								        ]
-												rate_limit: Refactor RateLimiterBackend to operate on keys and rules.

Instead of operating on RateLimitedObjects, and making the classes
depend on each too strongly. This also allows getting rid of get_keys()
function from RateLimitedObject, which was a redis rate limiter
implementation detail. RateLimitedObject should only define their own
key() function and the logic forming various necessary redis keys from
them should be in RedisRateLimiterBackend.

											
										
										
											2020-03-06 13:44:52 +01:00
 								    @classmethod
-												mypy: Enable new error explicit-override.

Signed-off-by: Anders Kaseorg <anders@zulip.com>

											
										
										
											2023-10-12 19:43:45 +02:00
+								    @override
-												rate_limit: Refactor RateLimiterBackend to operate on keys and rules.

Instead of operating on RateLimitedObjects, and making the classes
depend on each too strongly. This also allows getting rid of get_keys()
function from RateLimitedObject, which was a redis rate limiter
implementation detail. RateLimitedObject should only define their own
key() function and the logic forming various necessary redis keys from
them should be in RedisRateLimiterBackend.

											
										
										
											2020-03-06 13:44:52 +01:00
+								    def block_access(cls, entity_key: str, seconds: int) -> None:
-												ruff: Fix Q002 Single quote docstring found.

Signed-off-by: Anders Kaseorg <anders@zulip.com>

											
										
										
											2022-12-14 10:46:29 +01:00
+								        """Manually blocks an entity for the desired number of seconds"""
-												rate_limit: Refactor RateLimiterBackend to operate on keys and rules.

Instead of operating on RateLimitedObjects, and making the classes
depend on each too strongly. This also allows getting rid of get_keys()
function from RateLimitedObject, which was a redis rate limiter
implementation detail. RateLimitedObject should only define their own
key() function and the logic forming various necessary redis keys from
them should be in RedisRateLimiterBackend.

											
										
										
											2020-03-06 13:44:52 +01:00
+								        _, _, blocking_key = cls.get_keys(entity_key)
-												rate_limit: Add the concept of RateLimiterBackend.

This will allow easily swapping and using various implementations of
rate-limiting, and separate the implementation logic from
RateLimitedObjects.

											
										
										
											2020-03-05 13:38:20 +01:00
+								        with client.pipeline() as pipe:
 								            pipe.set(blocking_key, 1)
 								            pipe.expire(blocking_key, seconds)
 								            pipe.execute()
 								    @classmethod
-												mypy: Enable new error explicit-override.

Signed-off-by: Anders Kaseorg <anders@zulip.com>

											
										
										
											2023-10-12 19:43:45 +02:00
+								    @override
-												rate_limit: Refactor RateLimiterBackend to operate on keys and rules.

Instead of operating on RateLimitedObjects, and making the classes
depend on each too strongly. This also allows getting rid of get_keys()
function from RateLimitedObject, which was a redis rate limiter
implementation detail. RateLimitedObject should only define their own
key() function and the logic forming various necessary redis keys from
them should be in RedisRateLimiterBackend.

											
										
										
											2020-03-06 13:44:52 +01:00
+								    def unblock_access(cls, entity_key: str) -> None:
 								        _, _, blocking_key = cls.get_keys(entity_key)
-												rate_limit: Add the concept of RateLimiterBackend.

This will allow easily swapping and using various implementations of
rate-limiting, and separate the implementation logic from
RateLimitedObjects.

											
										
										
											2020-03-05 13:38:20 +01:00
+								        client.delete(blocking_key)
 								    @classmethod
-												mypy: Enable new error explicit-override.

Signed-off-by: Anders Kaseorg <anders@zulip.com>

											
										
										
											2023-10-12 19:43:45 +02:00
+								    @override
-												rate_limit: Refactor RateLimiterBackend to operate on keys and rules.

Instead of operating on RateLimitedObjects, and making the classes
depend on each too strongly. This also allows getting rid of get_keys()
function from RateLimitedObject, which was a redis rate limiter
implementation detail. RateLimitedObject should only define their own
key() function and the logic forming various necessary redis keys from
them should be in RedisRateLimiterBackend.

											
										
										
											2020-03-06 13:44:52 +01:00
+								    def clear_history(cls, entity_key: str) -> None:
 								        for key in cls.get_keys(entity_key):
-												rate_limit: Add the concept of RateLimiterBackend.

This will allow easily swapping and using various implementations of
rate-limiting, and separate the implementation logic from
RateLimitedObjects.

											
										
										
											2020-03-05 13:38:20 +01:00
+								            client.delete(key)
 								    @classmethod
-												mypy: Enable new error explicit-override.

Signed-off-by: Anders Kaseorg <anders@zulip.com>

											
										
										
											2023-10-12 19:43:45 +02:00
+								    @override
-												python: Reformat with Black, except quotes.

Signed-off-by: Anders Kaseorg <anders@zulip.com>

											
										
										
											2021-02-12 08:19:30 +01:00
+								    def get_api_calls_left(
 								        cls, entity_key: str, range_seconds: int, max_calls: int
-												ruff: Fix UP006 Use `list` instead of `List` for type annotation.

Signed-off-by: Anders Kaseorg <anders@zulip.com>

											
										
										
											2024-07-12 02:30:17 +02:00
+								    ) -> tuple[int, float]:
-												rate_limit: Refactor RateLimiterBackend to operate on keys and rules.

Instead of operating on RateLimitedObjects, and making the classes
depend on each too strongly. This also allows getting rid of get_keys()
function from RateLimitedObject, which was a redis rate limiter
implementation detail. RateLimitedObject should only define their own
key() function and the logic forming various necessary redis keys from
them should be in RedisRateLimiterBackend.

											
										
										
											2020-03-06 13:44:52 +01:00
+								        list_key, set_key, _ = cls.get_keys(entity_key)
-												rate_limit: Add the concept of RateLimiterBackend.

This will allow easily swapping and using various implementations of
rate-limiting, and separate the implementation logic from
RateLimitedObjects.

											
										
										
											2020-03-05 13:38:20 +01:00
+								        # Count the number of values in our sorted set
 								        # that are between now and the cutoff
 								        now = time.time()
 								        boundary = now - range_seconds
 								        with client.pipeline() as pipe:
 								            # Count how many API calls in our range have already been made
 								            pipe.zcount(set_key, boundary, now)
 								            # Get the newest call so we can calculate when the ratelimit
 								            # will reset to 0
 								            pipe.lindex(list_key, 0)
 								            results = pipe.execute()
-												Add a rate limiting system to our backend

(imported from commit a1218618918b4dedc77307e2f277665e7dd8fa22)

											
										
										
											2013-05-29 23:58:07 +02:00
-												python: Convert assignment type annotations to Python 3.6 style.

This commit was split by tabbott; this piece covers the vast majority
of files in Zulip, but excludes scripts/, tools/, and puppet/ to help
ensure we at least show the right error messages for Xenial systems.

We can likely further refine the remaining pieces with some testing.

Generated by com2ann, with whitespace fixes and various manual fixes
for runtime issues:

-    invoiced_through: Optional[LicenseLedger] = models.ForeignKey(
+    invoiced_through: Optional["LicenseLedger"] = models.ForeignKey(

-_apns_client: Optional[APNsClient] = None
+_apns_client: Optional["APNsClient"] = None

-    notifications_stream: Optional[Stream] = models.ForeignKey('Stream', related_name='+', null=True, blank=True, on_delete=CASCADE)
-    signup_notifications_stream: Optional[Stream] = models.ForeignKey('Stream', related_name='+', null=True, blank=True, on_delete=CASCADE)
+    notifications_stream: Optional["Stream"] = models.ForeignKey('Stream', related_name='+', null=True, blank=True, on_delete=CASCADE)
+    signup_notifications_stream: Optional["Stream"] = models.ForeignKey('Stream', related_name='+', null=True, blank=True, on_delete=CASCADE)

-    author: Optional[UserProfile] = models.ForeignKey('UserProfile', blank=True, null=True, on_delete=CASCADE)
+    author: Optional["UserProfile"] = models.ForeignKey('UserProfile', blank=True, null=True, on_delete=CASCADE)

-    bot_owner: Optional[UserProfile] = models.ForeignKey('self', null=True, on_delete=models.SET_NULL)
+    bot_owner: Optional["UserProfile"] = models.ForeignKey('self', null=True, on_delete=models.SET_NULL)

-    default_sending_stream: Optional[Stream] = models.ForeignKey('zerver.Stream', null=True, related_name='+', on_delete=CASCADE)
-    default_events_register_stream: Optional[Stream] = models.ForeignKey('zerver.Stream', null=True, related_name='+', on_delete=CASCADE)
+    default_sending_stream: Optional["Stream"] = models.ForeignKey('zerver.Stream', null=True, related_name='+', on_delete=CASCADE)
+    default_events_register_stream: Optional["Stream"] = models.ForeignKey('zerver.Stream', null=True, related_name='+', on_delete=CASCADE)

-descriptors_by_handler_id: Dict[int, ClientDescriptor] = {}
+descriptors_by_handler_id: Dict[int, "ClientDescriptor"] = {}

-worker_classes: Dict[str, Type[QueueProcessingWorker]] = {}
-queues: Dict[str, Dict[str, Type[QueueProcessingWorker]]] = {}
+worker_classes: Dict[str, Type["QueueProcessingWorker"]] = {}
+queues: Dict[str, Dict[str, Type["QueueProcessingWorker"]]] = {}

-AUTH_LDAP_REVERSE_EMAIL_SEARCH: Optional[LDAPSearch] = None
+AUTH_LDAP_REVERSE_EMAIL_SEARCH: Optional["LDAPSearch"] = None

Signed-off-by: Anders Kaseorg <anders@zulipchat.com>

											
										
										
											2020-04-22 01:09:50 +02:00
+								        count: int = results[0]
-												ruff: Fix UP007 Use `X | Y` for type annotations.

Signed-off-by: Anders Kaseorg <anders@zulip.com>

											
										
										
											2024-07-12 02:30:23 +02:00
+								        newest_call: bytes | None = results[1]
-												Add a rate limiting system to our backend

(imported from commit a1218618918b4dedc77307e2f277665e7dd8fa22)

											
										
										
											2013-05-29 23:58:07 +02:00
-												rate_limit: Add the concept of RateLimiterBackend.

This will allow easily swapping and using various implementations of
rate-limiting, and separate the implementation logic from
RateLimitedObjects.

											
										
										
											2020-03-05 13:38:20 +01:00
+								        calls_left = max_calls - count
 								        if newest_call is not None:
 								            time_reset = now + (range_seconds - (now - float(newest_call)))
 								        else:
 								            time_reset = now
-												Add a rate limiting system to our backend

(imported from commit a1218618918b4dedc77307e2f277665e7dd8fa22)

											
										
										
											2013-05-29 23:58:07 +02:00
-												rate_limiter: Fix secs_to_freedom being set to a timestamp.

time_reset returned from api_calls_left() was a timestamp, but
mistakenly treated as delta seconds. We change the return value of
api_calls_left() to be delta seconds, to be consistent with the return
value of rate_limit().

											
										
										
											2020-04-01 18:44:19 +02:00
+								        return calls_left, time_reset - now
-												Add a rate limiting system to our backend

(imported from commit a1218618918b4dedc77307e2f277665e7dd8fa22)

											
										
										
											2013-05-29 23:58:07 +02:00
-												rate_limit: Add the concept of RateLimiterBackend.

This will allow easily swapping and using various implementations of
rate-limiting, and separate the implementation logic from
RateLimitedObjects.

											
										
										
											2020-03-05 13:38:20 +01:00
+								    @classmethod
-												ruff: Fix UP006 Use `list` instead of `List` for type annotation.

Signed-off-by: Anders Kaseorg <anders@zulip.com>

											
										
										
											2024-07-12 02:30:17 +02:00
+								    def is_ratelimited(cls, entity_key: str, rules: list[tuple[int, int]]) -> tuple[bool, float]:
-												ruff: Fix Q002 Single quote docstring found.

Signed-off-by: Anders Kaseorg <anders@zulip.com>

											
										
										
											2022-12-14 10:46:29 +01:00
+								        """Returns a tuple of (rate_limited, time_till_free)"""
-												rate_limiter: Handle edge case where rules list may be empty.

											
										
										
											2020-04-02 22:23:20 +02:00
+								        assert rules
-												rate_limit: Refactor RateLimiterBackend to operate on keys and rules.

Instead of operating on RateLimitedObjects, and making the classes
depend on each too strongly. This also allows getting rid of get_keys()
function from RateLimitedObject, which was a redis rate limiter
implementation detail. RateLimitedObject should only define their own
key() function and the logic forming various necessary redis keys from
them should be in RedisRateLimiterBackend.

											
										
										
											2020-03-06 13:44:52 +01:00
+								        list_key, set_key, blocking_key = cls.get_keys(entity_key)
-												Add a rate limiting system to our backend

(imported from commit a1218618918b4dedc77307e2f277665e7dd8fa22)

											
										
										
											2013-05-29 23:58:07 +02:00
-												rate_limit: Add the concept of RateLimiterBackend.

This will allow easily swapping and using various implementations of
rate-limiting, and separate the implementation logic from
RateLimitedObjects.

											
										
										
											2020-03-05 13:38:20 +01:00
+								        # Go through the rules from shortest to longest,
 								        # seeing if this user has violated any of them. First
 								        # get the timestamps for each nth items
 								        with client.pipeline() as pipe:
 								            for _, request_count in rules:
 								                pipe.lindex(list_key, request_count - 1)  # 0-indexed list
 								            # Get blocking info
 								            pipe.get(blocking_key)
 								            pipe.ttl(blocking_key)
-												ruff: Fix UP007 Use `X | Y` for type annotations.

Signed-off-by: Anders Kaseorg <anders@zulip.com>

											
										
										
											2024-07-12 02:30:23 +02:00
+								            rule_timestamps: list[bytes | None] = pipe.execute()
-												rate_limit: Add the concept of RateLimiterBackend.

This will allow easily swapping and using various implementations of
rate-limiting, and separate the implementation logic from
RateLimitedObjects.

											
										
										
											2020-03-05 13:38:20 +01:00
 								        # Check if there is a manual block on this API key
 								        blocking_ttl_b = rule_timestamps.pop()
 								        key_blocked = rule_timestamps.pop()
 								        if key_blocked is not None:
 								            # We are manually blocked. Report for how much longer we will be
-												test-backend: Remove rate_limiter from not_yet_fully_covered.

rate_limiter.py now has sufficient test coverage to remove from the
list of exclusions.

Tweaked by tabbott to handle @abstractmethod in a better way.

											
										
										
											2020-04-02 23:00:56 +02:00
+								            if blocking_ttl_b is None:  # nocoverage # defensive code, this should never happen
-												rate_limit: Add the concept of RateLimiterBackend.

This will allow easily swapping and using various implementations of
rate-limiting, and separate the implementation logic from
RateLimitedObjects.

											
										
										
											2020-03-05 13:38:20 +01:00
+								                blocking_ttl = 0.5
 								            else:
 								                blocking_ttl = int(blocking_ttl_b)
 								            return True, blocking_ttl
 								        now = time.time()
-												ruff: Fix B905 `zip()` without an explicit `strict=` parameter.

Signed-off-by: Anders Kaseorg <anders@zulip.com>

											
										
										
											2024-07-12 02:30:30 +02:00
+								        for timestamp, (range_seconds, num_requests) in zip(rule_timestamps, rules, strict=False):
-												rate_limit: Add the concept of RateLimiterBackend.

This will allow easily swapping and using various implementations of
rate-limiting, and separate the implementation logic from
RateLimitedObjects.

											
										
										
											2020-03-05 13:38:20 +01:00
+								            # Check if the nth timestamp is newer than the associated rule. If so,
 								            # it means we've hit our limit for this rule
 								            if timestamp is None:
 								                continue
-												Add a rate limiting system to our backend

(imported from commit a1218618918b4dedc77307e2f277665e7dd8fa22)

											
										
										
											2013-05-29 23:58:07 +02:00
-												rate_limit: Add the concept of RateLimiterBackend.

This will allow easily swapping and using various implementations of
rate-limiting, and separate the implementation logic from
RateLimitedObjects.

											
										
										
											2020-03-05 13:38:20 +01:00
+								            boundary = float(timestamp) + range_seconds
-												rate_limiter: Fix inconsistency in an edge case in redis limiter.

If we had a rule like "max 3 requests in 2 seconds", there was an
inconsistency between is_ratelimited() and get_api_calls_left().
If you had:
request #1 at time 0
request #2 and #3 at some times < 2

Next request, if exactly at time 2, would not get ratelimited, but if
get_api_calls_left was called, it would return 0. This was due to
inconsistency on the boundary - the check in is_ratelimited was
exclusive, while get_api_calls_left uses zcount, which is inclusive.

											
										
										
											2020-04-02 17:44:23 +02:00
+								            if boundary >= now:
-												rate_limit: Add the concept of RateLimiterBackend.

This will allow easily swapping and using various implementations of
rate-limiting, and separate the implementation logic from
RateLimitedObjects.

											
										
										
											2020-03-05 13:38:20 +01:00
+								                free = boundary - now
 								                return True, free
-												Add a rate limiting system to our backend

(imported from commit a1218618918b4dedc77307e2f277665e7dd8fa22)

											
										
										
											2013-05-29 23:58:07 +02:00
+								        return False, 0.0
-												rate_limit: Add the concept of RateLimiterBackend.

This will allow easily swapping and using various implementations of
rate-limiting, and separate the implementation logic from
RateLimitedObjects.

											
										
										
											2020-03-05 13:38:20 +01:00
+								    @classmethod
-												rate_limiter: Handle edge case where rules list may be empty.

											
										
										
											2020-04-02 22:23:20 +02:00
+								    def incr_ratelimit(cls, entity_key: str, max_api_calls: int, max_api_window: int) -> None:
-												rate_limit: Add the concept of RateLimiterBackend.

This will allow easily swapping and using various implementations of
rate-limiting, and separate the implementation logic from
RateLimitedObjects.

											
										
										
											2020-03-05 13:38:20 +01:00
+								        """Increases the rate-limit for the specified entity"""
-												rate_limit: Refactor RateLimiterBackend to operate on keys and rules.

Instead of operating on RateLimitedObjects, and making the classes
depend on each too strongly. This also allows getting rid of get_keys()
function from RateLimitedObject, which was a redis rate limiter
implementation detail. RateLimitedObject should only define their own
key() function and the logic forming various necessary redis keys from
them should be in RedisRateLimiterBackend.

											
										
										
											2020-03-06 13:44:52 +01:00
+								        list_key, set_key, _ = cls.get_keys(entity_key)
-												rate_limit: Add the concept of RateLimiterBackend.

This will allow easily swapping and using various implementations of
rate-limiting, and separate the implementation logic from
RateLimitedObjects.

											
										
										
											2020-03-05 13:38:20 +01:00
+								        now = time.time()
-												Add a rate limiting system to our backend

(imported from commit a1218618918b4dedc77307e2f277665e7dd8fa22)

											
										
										
											2013-05-29 23:58:07 +02:00
-												docs: Fix more capitalization issues.

Signed-off-by: Anders Kaseorg <anders@zulip.com>

											
										
										
											2020-10-23 02:43:28 +02:00
+								        # Start Redis transaction
-												rate_limit: Add the concept of RateLimiterBackend.

This will allow easily swapping and using various implementations of
rate-limiting, and separate the implementation logic from
RateLimitedObjects.

											
										
										
											2020-03-05 13:38:20 +01:00
+								        with client.pipeline() as pipe:
 								            count = 0
 								            while True:
 								                try:
 								                    # To avoid a race condition between getting the element we might trim from our list
 								                    # and removing it from our associated set, we abort this whole transaction if
 								                    # another agent manages to change our list out from under us
 								                    # When watching a value, the pipeline is set to Immediate mode
 								                    pipe.watch(list_key)
-												Add a rate limiting system to our backend

(imported from commit a1218618918b4dedc77307e2f277665e7dd8fa22)

											
										
										
											2013-05-29 23:58:07 +02:00
-												rate_limit: Add the concept of RateLimiterBackend.

This will allow easily swapping and using various implementations of
rate-limiting, and separate the implementation logic from
RateLimitedObjects.

											
										
										
											2020-03-05 13:38:20 +01:00
+								                    # Get the last elem that we'll trim (so we can remove it from our sorted set)
-												requirements: Upgrade Python requirements.

Signed-off-by: Anders Kaseorg <anders@zulip.com>

											
										
										
											2021-07-03 02:47:21 +02:00
+								                    last_val = cast(  # mypy doesn’t know the pipe is in immediate mode
-												ruff: Fix UP007 Use `X | Y` for type annotations.

Signed-off-by: Anders Kaseorg <anders@zulip.com>

											
										
										
											2024-07-12 02:30:23 +02:00
+								                        bytes | None, pipe.lindex(list_key, max_api_calls - 1)
-												requirements: Upgrade Python requirements.

Signed-off-by: Anders Kaseorg <anders@zulip.com>

											
										
										
											2021-07-03 02:47:21 +02:00
+								                    )
-												Add a rate limiting system to our backend

(imported from commit a1218618918b4dedc77307e2f277665e7dd8fa22)

											
										
										
											2013-05-29 23:58:07 +02:00
-												rate_limit: Add the concept of RateLimiterBackend.

This will allow easily swapping and using various implementations of
rate-limiting, and separate the implementation logic from
RateLimitedObjects.

											
										
										
											2020-03-05 13:38:20 +01:00
+								                    # Restart buffered execution
 								                    pipe.multi()
-												Add a rate limiting system to our backend

(imported from commit a1218618918b4dedc77307e2f277665e7dd8fa22)

											
										
										
											2013-05-29 23:58:07 +02:00
-												rate_limit: Add the concept of RateLimiterBackend.

This will allow easily swapping and using various implementations of
rate-limiting, and separate the implementation logic from
RateLimitedObjects.

											
										
										
											2020-03-05 13:38:20 +01:00
+								                    # Add this timestamp to our list
 								                    pipe.lpush(list_key, now)
-												Add a rate limiting system to our backend

(imported from commit a1218618918b4dedc77307e2f277665e7dd8fa22)

											
										
										
											2013-05-29 23:58:07 +02:00
-												rate_limit: Add the concept of RateLimiterBackend.

This will allow easily swapping and using various implementations of
rate-limiting, and separate the implementation logic from
RateLimitedObjects.

											
										
										
											2020-03-05 13:38:20 +01:00
+								                    # Trim our list to the oldest rule we have
-												rate_limit: Refactor RateLimiterBackend to operate on keys and rules.

Instead of operating on RateLimitedObjects, and making the classes
depend on each too strongly. This also allows getting rid of get_keys()
function from RateLimitedObject, which was a redis rate limiter
implementation detail. RateLimitedObject should only define their own
key() function and the logic forming various necessary redis keys from
them should be in RedisRateLimiterBackend.

											
										
										
											2020-03-06 13:44:52 +01:00
+								                    pipe.ltrim(list_key, 0, max_api_calls - 1)
-												Add a rate limiting system to our backend

(imported from commit a1218618918b4dedc77307e2f277665e7dd8fa22)

											
										
										
											2013-05-29 23:58:07 +02:00
-												rate_limit: Add the concept of RateLimiterBackend.

This will allow easily swapping and using various implementations of
rate-limiting, and separate the implementation logic from
RateLimitedObjects.

											
										
										
											2020-03-05 13:38:20 +01:00
+								                    # Add our new value to the sorted set that we keep
 								                    # We need to put the score and val both as timestamp,
 								                    # as we sort by score but remove by value
 								                    pipe.zadd(set_key, {str(now): now})
-												Add a rate limiting system to our backend

(imported from commit a1218618918b4dedc77307e2f277665e7dd8fa22)

											
										
										
											2013-05-29 23:58:07 +02:00
-												rate_limit: Add the concept of RateLimiterBackend.

This will allow easily swapping and using various implementations of
rate-limiting, and separate the implementation logic from
RateLimitedObjects.

											
										
										
											2020-03-05 13:38:20 +01:00
+								                    # Remove the trimmed value from our sorted set, if there was one
 								                    if last_val is not None:
 								                        pipe.zrem(set_key, last_val)
-												Add a rate limiting system to our backend

(imported from commit a1218618918b4dedc77307e2f277665e7dd8fa22)

											
										
										
											2013-05-29 23:58:07 +02:00
-												rate_limit: Add the concept of RateLimiterBackend.

This will allow easily swapping and using various implementations of
rate-limiting, and separate the implementation logic from
RateLimitedObjects.

											
										
										
											2020-03-05 13:38:20 +01:00
+								                    # Set the TTL for our keys as well
-												rate_limit: Refactor RateLimiterBackend to operate on keys and rules.

Instead of operating on RateLimitedObjects, and making the classes
depend on each too strongly. This also allows getting rid of get_keys()
function from RateLimitedObject, which was a redis rate limiter
implementation detail. RateLimitedObject should only define their own
key() function and the logic forming various necessary redis keys from
them should be in RedisRateLimiterBackend.

											
										
										
											2020-03-06 13:44:52 +01:00
+								                    api_window = max_api_window
-												rate_limit: Add the concept of RateLimiterBackend.

This will allow easily swapping and using various implementations of
rate-limiting, and separate the implementation logic from
RateLimitedObjects.

											
										
										
											2020-03-05 13:38:20 +01:00
+								                    pipe.expire(list_key, api_window)
 								                    pipe.expire(set_key, api_window)
-												Add a rate limiting system to our backend

(imported from commit a1218618918b4dedc77307e2f277665e7dd8fa22)

											
										
										
											2013-05-29 23:58:07 +02:00
-												rate_limit: Add the concept of RateLimiterBackend.

This will allow easily swapping and using various implementations of
rate-limiting, and separate the implementation logic from
RateLimitedObjects.

											
										
										
											2020-03-05 13:38:20 +01:00
+								                    pipe.execute()
-												Add a rate limiting system to our backend

(imported from commit a1218618918b4dedc77307e2f277665e7dd8fa22)

											
										
										
											2013-05-29 23:58:07 +02:00
-												rate_limit: Add the concept of RateLimiterBackend.

This will allow easily swapping and using various implementations of
rate-limiting, and separate the implementation logic from
RateLimitedObjects.

											
										
										
											2020-03-05 13:38:20 +01:00
+								                    # If no exception was raised in the execution, there were no transaction conflicts
 								                    break
-												test-backend: Remove rate_limiter from not_yet_fully_covered.

rate_limiter.py now has sufficient test coverage to remove from the
list of exclusions.

Tweaked by tabbott to handle @abstractmethod in a better way.

											
										
										
											2020-04-02 23:00:56 +02:00
+								                except redis.WatchError:  # nocoverage # Ideally we'd have a test for this.
-												rate_limit: Add the concept of RateLimiterBackend.

This will allow easily swapping and using various implementations of
rate-limiting, and separate the implementation logic from
RateLimitedObjects.

											
										
										
											2020-03-05 13:38:20 +01:00
+								                    if count > 10:
-												ruff: Fix RSE102 Unnecessary parentheses on raised exception.

Signed-off-by: Anders Kaseorg <anders@zulip.com>

											
										
										
											2023-02-04 02:07:20 +01:00
+								                        raise RateLimiterLockingError
-												rate_limit: Add the concept of RateLimiterBackend.

This will allow easily swapping and using various implementations of
rate-limiting, and separate the implementation logic from
RateLimitedObjects.

											
										
										
											2020-03-05 13:38:20 +01:00
+								                    count += 1
-												Properly calculate expiry of keys we add to Redis

(imported from commit 42fda34ed1cd1eb9411defa1c0cbf53ef0de7a7b)

											
										
										
											2013-06-05 22:32:23 +02:00
-												rate_limit: Add the concept of RateLimiterBackend.

This will allow easily swapping and using various implementations of
rate-limiting, and separate the implementation logic from
RateLimitedObjects.

											
										
										
											2020-03-05 13:38:20 +01:00
+								                    continue
-												Add a rate limiting system to our backend

(imported from commit a1218618918b4dedc77307e2f277665e7dd8fa22)

											
										
										
											2013-05-29 23:58:07 +02:00
-												rate_limit: Add the concept of RateLimiterBackend.

This will allow easily swapping and using various implementations of
rate-limiting, and separate the implementation logic from
RateLimitedObjects.

											
										
										
											2020-03-05 13:38:20 +01:00
+								    @classmethod
-												mypy: Enable new error explicit-override.

Signed-off-by: Anders Kaseorg <anders@zulip.com>

											
										
										
											2023-10-12 19:43:45 +02:00
+								    @override
-												python: Reformat with Black, except quotes.

Signed-off-by: Anders Kaseorg <anders@zulip.com>

											
										
										
											2021-02-12 08:19:30 +01:00
+								    def rate_limit_entity(
-												ruff: Fix UP006 Use `list` instead of `List` for type annotation.

Signed-off-by: Anders Kaseorg <anders@zulip.com>

											
										
										
											2024-07-12 02:30:17 +02:00
+								        cls, entity_key: str, rules: list[tuple[int, int]], max_api_calls: int, max_api_window: int
 								    ) -> tuple[bool, float]:
-												rate_limit: Refactor RateLimiterBackend to operate on keys and rules.

Instead of operating on RateLimitedObjects, and making the classes
depend on each other too strongly. This also allows getting rid of get_keys()
function from RateLimitedObject, which was a redis rate limiter
implementation detail. RateLimitedObject should only define their own
key() function and the logic forming various necessary redis keys from
them should be in RedisRateLimiterBackend.

											
										
										
											2020-03-06 13:44:52 +01:00
+								        ratelimited, time = cls.is_ratelimited(entity_key, rules)
-												Add a rate limiting system to our backend

(imported from commit a1218618918b4dedc77307e2f277665e7dd8fa22)

											
										
										
											2013-05-29 23:58:07 +02:00
-												Remove statsd support.

Signed-off-by: Anders Kaseorg <anders@zulip.com>

											
										
										
											2023-04-26 03:09:19 +02:00
+								        if not ratelimited:
-												rate_limit: Add the concept of RateLimiterBackend.

This will allow easily swapping and using various implementations of
rate-limiting, and separate the implementation logic from
RateLimitedObjects.

											
										
										
											2020-03-05 13:38:20 +01:00
+								            try:
-												rate_limiter: Handle edge case where rules list may be empty.

											
										
										
											2020-04-02 22:23:20 +02:00
+								                cls.incr_ratelimit(entity_key, max_api_calls, max_api_window)
-												ruff: Fix N818 exception name should be named with an Error suffix.

Signed-off-by: Anders Kaseorg <anders@zulip.com>

											
										
										
											2022-11-17 09:30:48 +01:00
+								            except RateLimiterLockingError:
-												logging: Pass format arguments to logging.

https://docs.python.org/3/howto/logging.html#optimization

Signed-off-by: Anders Kaseorg <anders@zulip.com>

											
										
										
											2020-05-02 08:44:14 +02:00
+								                logger.warning("Deadlock trying to incr_ratelimit for %s", entity_key)
-												rate_limit: Add the concept of RateLimiterBackend.

This will allow easily swapping and using various implementations of
rate-limiting, and separate the implementation logic from
RateLimitedObjects.

											
										
										
											2020-03-05 13:38:20 +01:00
+								                # rate-limit users who are hitting the API so hard we can't update our stats.
 								                ratelimited = True
 								        return ratelimited, time
-												rate_limiter: Generalise some rate_limit_user code.

We create rate_limit_entity as a general rate-limiting function for
RateLimitedObjects, from code that was possible to abstract away from
rate_limit_user and that will be used for other kinds of rate limiting.
We make rate_limit_user use this new general framework from now.

											
										
										
											2019-03-23 18:33:37 +01:00
-												python: Reformat with Black, except quotes.

Signed-off-by: Anders Kaseorg <anders@zulip.com>

											
										
										
											2021-02-12 08:19:30 +01:00
-												rate_limiter: Handle multiple types of rate limiting in middleware.

As more types of rate limiting of requests are added, one request may
end up having various limits applied to it - and the middleware needs to
be able to handle that. We implement that through a set_response_headers
function, which sets the X-RateLimit-* headers in a sensible way based
on all the limits that were applied to the request.

											
										
										
											2019-12-28 20:23:18 +01:00
+								class RateLimitResult:
-												python: Reformat with Black, except quotes.

Signed-off-by: Anders Kaseorg <anders@zulip.com>

											
										
										
											2021-02-12 08:19:30 +01:00
+								    def __init__(
 								        self, entity: RateLimitedObject, secs_to_freedom: float, over_limit: bool, remaining: int
 								    ) -> None:
-												rate_limiter: Handle multiple types of rate limiting in middleware.

As more types of rate limiting of requests are added, one request may
end up having various limits applied to it - and the middleware needs to
be able to handle that. We implement that through a set_response_headers
function, which sets the X-RateLimit-* headers in a sensible way based
on all the limits that were applied to the request.

											
										
										
											2019-12-28 20:23:18 +01:00
+								        if over_limit:
 								            assert not remaining
 								        self.entity = entity
 								        self.secs_to_freedom = secs_to_freedom
 								        self.over_limit = over_limit
 								        self.remaining = remaining
-												upload: Allow rate limited access to spectators for uploaded files.

We allow spectators access to uploaded files in web public streams
but rate limit the daily requests to 1000 per file by default.

											
										
										
											2021-11-02 15:42:58 +01:00
 								class RateLimitedSpectatorAttachmentAccessByFile(RateLimitedObject):
 								    def __init__(self, path_id: str) -> None:
 								        self.path_id = path_id
 								        super().__init__()
-												mypy: Enable new error explicit-override.

Signed-off-by: Anders Kaseorg <anders@zulip.com>

											
										
										
											2023-10-12 19:43:45 +02:00
+								    @override
-												upload: Allow rate limited access to spectators for uploaded files.

We allow spectators access to uploaded files in web public streams
but rate limit the daily requests to 1000 per file by default.

											
										
										
											2021-11-02 15:42:58 +01:00
+								    def key(self) -> str:
 								        return f"{type(self).__name__}:{self.path_id}"
-												mypy: Enable new error explicit-override.

Signed-off-by: Anders Kaseorg <anders@zulip.com>

											
										
										
											2023-10-12 19:43:45 +02:00
+								    @override
-												ruff: Fix UP006 Use `list` instead of `List` for type annotation.

Signed-off-by: Anders Kaseorg <anders@zulip.com>

											
										
										
											2024-07-12 02:30:17 +02:00
+								    def rules(self) -> list[tuple[int, int]]:
-												upload: Allow rate limited access to spectators for uploaded files.

We allow spectators access to uploaded files in web public streams
but rate limit the daily requests to 1000 per file by default.

											
										
										
											2021-11-02 15:42:58 +01:00
+								        return settings.RATE_LIMITING_RULES["spectator_attachment_access_by_file"]
 								def rate_limit_spectator_attachment_access_by_file(path_id: str) -> None:
 								    ratelimited, _ = RateLimitedSpectatorAttachmentAccessByFile(path_id).rate_limit()
 								    if ratelimited:
-												ruff: Fix N818 exception name should be named with an Error suffix.

Signed-off-by: Anders Kaseorg <anders@zulip.com>

											
										
										
											2022-11-17 09:30:48 +01:00
+								        raise RateLimitedError
-												rate_limiter: Extract rate limit related functions.

This refactors rate limit related functions from `zerver.decorator` to
zerver.lib.rate_limiter.

We conditionally import `RemoteZulipServer`, `RequestNotes`, and
`RateLimitedRemoteZulipServer` to avoid circular dependency.

Most instances of importing these functions from `zerver.decorator` got
updated, with a few exceptions in `zerver.tests.test_decorators`, where
we do want to mock the rate limiting functions imported in
`zerver.decorator`. The same goes with the mocking example in the
"testing-with-django" documentation.

Signed-off-by: Zixuan James Li <p359101898@gmail.com>

											
										
										
											2022-08-05 17:40:03 +02:00
 								def is_local_addr(addr: str) -> bool:
 								    """Return True when ``addr`` is exactly the IPv4 or IPv6 loopback literal.
 								    This is a plain string comparison against "127.0.0.1" and "::1"; no
 								    address parsing or normalization is performed, so other spellings of
 								    a loopback address are not matched.
 								    """
 								    if addr == "127.0.0.1":
 								        return True
 								    return addr == "::1"
 								@cache_with_key(lambda: "tor_ip_addresses:", timeout=60 * 60)
 								@circuit(failure_threshold=2, recovery_timeout=60 * 10)
-												ruff: Fix UP006 Use `list` instead of `List` for type annotation.

Signed-off-by: Anders Kaseorg <anders@zulip.com>

											
										
										
											2024-07-12 02:30:17 +02:00
+								def get_tor_ips() -> set[str]:
-												rate_limiter: Extract rate limit related functions.

This refactors rate limit related functions from `zerver.decorator` to
zerver.lib.rate_limiter.

We conditionally import `RemoteZulipServer`, `RequestNotes`, and
`RateLimitedRemoteZulipServer` to avoid circular dependency.

Most instances of importing these functions from `zerver.decorator` got
updated, with a few exceptions in `zerver.tests.test_decorators`, where
we do want to mock the rate limiting functions imported in
`zerver.decorator`. The same goes with the mocking example in the
"testing-with-django" documentation.

Signed-off-by: Zixuan James Li <p359101898@gmail.com>

											
										
										
											2022-08-05 17:40:03 +02:00
+								    if not settings.RATE_LIMIT_TOR_TOGETHER:
 								        return set()
 								    # Cron job in /etc/cron.d/fetch-tor-exit-nodes fetches this
 								    # hourly; we cache it in memcached to prevent going to disk on
 								    # every unauth'd request.  In case of failures to read, we
 								    # circuit-break so 2 failures cause a 10-minute backoff.
 								    with open(settings.TOR_EXIT_NODE_FILE_PATH, "rb") as f:
 								        exit_node_list = orjson.loads(f.read())
 								    # This should always be non-empty; if it's empty, assume something
 								    # went wrong with writing and treat it as a non-existent file.
 								    # Circuit-breaking will ensure that we back off on re-reading the
 								    # file.
 								    if len(exit_node_list) == 0:
 								        raise OSError("File is empty")
 								    return set(exit_node_list)
 								def client_is_exempt_from_rate_limiting(request: HttpRequest) -> bool:
 								    """Decide whether ``request`` should bypass rate limiting entirely.
 								    A request is exempt only when its recorded client is named "internal"
 								    (compared case-insensitively) and, in addition, either the request's
 								    REMOTE_ADDR is a local address or settings.DEBUG_RATE_LIMITING is set.
 								    """
 								    # Imported here rather than at module level, as in the rest of this file.
 								    from zerver.lib.request import RequestNotes
 								    # Don't rate limit requests from Django that come from our own servers,
 								    # and don't rate-limit dev instances
 								    request_client = RequestNotes.get_notes(request).client
 								    if request_client is None:
 								        return False
 								    if request_client.name.lower() != "internal":
 								        return False
 								    # Only consult the setting when the address itself is not local.
 								    return is_local_addr(request.META["REMOTE_ADDR"]) or settings.DEBUG_RATE_LIMITING
 								def rate_limit_user(request: HttpRequest, user: UserProfile, domain: str) -> None:
-												ruff: Fix N818 exception name should be named with an Error suffix.

Signed-off-by: Anders Kaseorg <anders@zulip.com>

											
										
										
											2022-11-17 09:30:48 +01:00
+								    """Returns whether or not a user was rate limited. Will raise a RateLimitedError exception
-												rate_limiter: Extract rate limit related functions.

This refactors rate limit related functions from `zerver.decorator` to
zerver.lib.rate_limiter.

We conditionally import `RemoteZulipServer`, `RequestNotes`, and
`RateLimitedRemoteZulipServer` to avoid circular dependency.

Most instances of importing these functions from `zerver.decorator` got
updated, with a few exceptions in `zerver.tests.test_decorators`, where
we do want to mock the rate limiting functions imported in
`zerver.decorator`. The same goes with the mocking example in the
"testing-with-django" documentation.

Signed-off-by: Zixuan James Li <p359101898@gmail.com>

											
										
										
											2022-08-05 17:40:03 +02:00
+								    if the user has been rate limited, otherwise returns and modifies request to contain
 								    the rate limit information"""
-												rate_limit: Replace rate_limit with inlined rate limit checks.

This change incorporates should_rate_limit into rate_limit_user and
rate_limit_request_by_ip. Note a slight behavior change to other callers
to rate_limit_request_by_ip is made as we now check if the client is
eligible to be exempted from rate limiting now, which was previously
only done as a part of zerver.lib.rate_limiter.rate_limit.

Now we mock zerver.lib.rate_limiter.RateLimitedUser instead of
zerver.decorator.rate_limit_user in
zerver.tests.test_decorators.RateLimitTestCase, because rate_limit_user
will always be called but rate limit only happens when the should_rate_limit
check passes;

we can continue to mock zerver.lib.rate_limiter.rate_limit_ip, because the
decorated view functions call rate_limit_request_by_ip that calls
rate_limit_ip when the should_rate_limit check passes.

We need to mock zerver.decorator.rate_limit_user for SkipRateLimitingTest
now because rate_limit has been removed. We don't need to mock
RateLimitedUser in this case because we are only verifying that
the skip_rate_limiting flag works.

To ensure coverage in add_logging_data, a new test case is added to use
a web_public_view (which decorates the view function with
add_logging_data) with a new flag to check_rate_limit_public_or_user_views.

Signed-off-by: Zixuan James Li <p359101898@gmail.com>

											
										
										
											2022-08-14 21:14:52 +02:00
+								    if not should_rate_limit(request):
 								        return
-												rate_limiter: Extract rate limit related functions.

This refactors rate limit related functions from `zerver.decorator` to
zerver.lib.rate_limiter.

We conditionally import `RemoteZulipServer`, `RequestNotes`, and
`RateLimitedRemoteZulipServer` to avoid circular dependency.

Most instances of importing these functions from `zerver.decorator` got
updated, with a few exceptions in `zerver.tests.test_decorators`, where
we do want to mock the rate limiting functions imported in
`zerver.decorator`. The same goes with the mocking example in the
"testing-with-django" documentation.

Signed-off-by: Zixuan James Li <p359101898@gmail.com>

											
										
										
											2022-08-05 17:40:03 +02:00
 								    RateLimitedUser(user, domain=domain).rate_limit_request(request)
 								def rate_limit_request_by_ip(request: HttpRequest, domain: str) -> None:
-												rate_limit: Replace rate_limit with inlined rate limit checks.

This change incorporates should_rate_limit into rate_limit_user and
rate_limit_request_by_ip. Note a slight behavior change to other callers
to rate_limit_request_by_ip is made as we now check if the client is
eligible to be exempted from rate limiting now, which was previously
only done as a part of zerver.lib.rate_limiter.rate_limit.

Now we mock zerver.lib.rate_limiter.RateLimitedUser instead of
zerver.decorator.rate_limit_user in
zerver.tests.test_decorators.RateLimitTestCase, because rate_limit_user
will always be called but rate limit only happens when the should_rate_limit
check passes;

we can continue to mock zerver.lib.rate_limiter.rate_limit_ip, because the
decorated view functions call rate_limit_request_by_ip that calls
rate_limit_ip when the should_rate_limit check passes.

We need to mock zerver.decorator.rate_limit_user for SkipRateLimitingTest
now because rate_limit has been removed. We don't need to mock
RateLimitedUser in this case because we are only verifying that
the skip_rate_limiting flag works.

To ensure coverage in add_logging_data, a new test case is added to use
a web_public_view (which decorates the view function with
add_logging_data) with a new flag to check_rate_limit_public_or_user_views.

Signed-off-by: Zixuan James Li <p359101898@gmail.com>

											
										
										
											2022-08-14 21:14:52 +02:00
+								    if not should_rate_limit(request):
 								        return
-												rate_limiter: Extract rate limit related functions.

This refactors rate limit related functions from `zerver.decorator` to
zerver.lib.rate_limiter.

We conditionally import `RemoteZulipServer`, `RequestNotes`, and
`RateLimitedRemoteZulipServer` to avoid circular dependency.

Most instances of importing these functions from `zerver.decorator` got
updated, with a few exceptions in `zerver.tests.test_decorators`, where
we do want to mock the rate limiting functions imported in
`zerver.decorator`. The same goes with the mocking example in the
"testing-with-django" documentation.

Signed-off-by: Zixuan James Li <p359101898@gmail.com>

											
										
										
											2022-08-05 17:40:03 +02:00
+								    # REMOTE_ADDR is set by SetRemoteAddrFromRealIpHeader in conjunction
 								    # with the nginx configuration to guarantee this to be *the* correct
 								    # IP address to use - without worrying we'll grab the IP of a proxy.
 								    ip_addr = request.META["REMOTE_ADDR"]
 								    assert ip_addr
 								    try:
 								        # We lump all TOR exit nodes into one bucket; this prevents
 								        # abuse from TOR, while still allowing some access to these
 								        # endpoints for legitimate users.  Checking for local
 								        # addresses is a shortcut somewhat for ease of testing without
 								        # mocking the TOR endpoint in every test.
 								        if is_local_addr(ip_addr):
 								            pass
 								        elif ip_addr in get_tor_ips():
 								            ip_addr = "tor-exit-node"
 								    except (OSError, CircuitBreakerError) as err:
 								        # In the event that we can't get an updated list of TOR exit
 								        # nodes, assume the IP is _not_ one, and leave it unchanged.
 								        # We log a warning so that this endpoint being taken out of
 								        # service doesn't silently remove this functionality.
 								        logger.warning("Failed to fetch TOR exit node list: %s", err)
-												rate_limit: Remove rate_limit_ip.

Because rate_limit_request_by_ip is the only caller of it, it is safe
for us to inline RateLimitedIpAddr and remove this helper. This ensures
that we have consistent internals for rate limiting functions, which all
have a should_rate_limit check.

Signed-off-by: Zixuan James Li <p359101898@gmail.com>

											
										
										
											2022-08-17 16:22:26 +02:00
+								    RateLimitedIPAddr(ip_addr, domain=domain).rate_limit_request(request)
-												rate_limiter: Extract rate limit related functions.

This refactors rate limit related functions from `zerver.decorator` to
zerver.lib.rate_limiter.

We conditionally import `RemoteZulipServer`, `RequestNotes`, and
`RateLimitedRemoteZulipServer` to avoid circular dependency.

Most instances of importing these functions from `zerver.decorator` got
updated, with a few exceptions in `zerver.tests.test_decorators`, where
we do want to mock the rate limiting functions imported in
`zerver.decorator`. The same goes with the mocking example in the
"testing-with-django" documentation.

Signed-off-by: Zixuan James Li <p359101898@gmail.com>

											
										
										
											2022-08-05 17:40:03 +02:00
-												rate_limit: Extract should_rate_limit from rate_limit.

This allows us to reapply this check for other rate limiting functions.

Signed-off-by: Zixuan James Li <p359101898@gmail.com>

											
										
										
											2022-08-14 01:06:09 +02:00
+								def should_rate_limit(request: HttpRequest) -> bool:
-												rate_limiter: Extract rate limit related functions.

This refactors rate limit related functions from `zerver.decorator` to
zerver.lib.rate_limiter.

We conditionally import `RemoteZulipServer`, `RequestNotes`, and
`RateLimitedRemoteZulipServer` to avoid circular dependency.

Most instances of importing these functions from `zerver.decorator` got
updated, with a few exceptions in `zerver.tests.test_decorators`, where
we do want to mock the rate limiting functions imported in
`zerver.decorator`. The same goes with the mocking example in the
"testing-with-django" documentation.

Signed-off-by: Zixuan James Li <p359101898@gmail.com>

											
										
										
											2022-08-05 17:40:03 +02:00
+								    if not settings.RATE_LIMITING:
-												rate_limit: Extract should_rate_limit from rate_limit.

This allows us to reapply this check for other rate limiting functions.

Signed-off-by: Zixuan James Li <p359101898@gmail.com>

											
										
										
											2022-08-14 01:06:09 +02:00
+								        return False
-												rate_limiter: Extract rate limit related functions.

This refactors rate limit related functions from `zerver.decorator` to
zerver.lib.rate_limiter.

We conditionally import `RemoteZulipServer`, `RequestNotes`, and
`RateLimitedRemoteZulipServer` to avoid circular dependency.

Most instances of importing these functions from `zerver.decorator` got
updated, with a few exceptions in `zerver.tests.test_decorators`, where
we do want to mock the rate limiting functions imported in
`zerver.decorator`. The same goes with the mocking example in the
"testing-with-django" documentation.

Signed-off-by: Zixuan James Li <p359101898@gmail.com>

											
										
										
											2022-08-05 17:40:03 +02:00
 								    if client_is_exempt_from_rate_limiting(request):
-												rate_limit: Extract should_rate_limit from rate_limit.

This allows us to reapply this check for other rate limiting functions.

Signed-off-by: Zixuan James Li <p359101898@gmail.com>

											
										
										
											2022-08-14 01:06:09 +02:00
+								        return False
 								    return True