Merge branch 'pr-36' (rate limiting) into 0.0.3-draft

Combined MAX_RESPONSE_SIZE dynamic calculation with RateLimiter class.
security(polymarket-browse): add token bucket rate limiter for API calls
2026-03-27 02:28:16 +00:00 · 2026-03-26 19:15:02 +00:00
1 changed file with 35 additions and 1 deletion
--- a/skills/polymarket-browse/scripts/browse.py
+++ b/skills/polymarket-browse/scripts/browse.py
@@ -11,6 +11,7 @@ import time
 import argparse
 import hashlib
 import os
 import threading
 from concurrent.futures import ThreadPoolExecutor, as_completed
 from datetime import datetime, timezone, timedelta
 from typing import Any, Callable, TypedDict
@@ -101,6 +102,8 @@ INITIAL_RETRY_DELAY = 2  # exponential backoff starts at 2s
 MAX_RESPONSE_SIZE_MULTIPLIER = 10  # Response size limit = PAGE_SIZE * multiplier
 MAX_RESPONSE_SIZE_MIN = 10 * 1024 * 1024  # 10MB minimum
 MAX_RESPONSE_SIZE_MAX = 100 * 1024 * 1024  # 100MB maximum for safety
 # Default RateLimiter settings: at most RATE_LIMIT_CALLS calls per
 # RATE_LIMIT_WINDOW seconds (the bucket starts full, so bursts up to
 # RATE_LIMIT_CALLS are allowed).
 RATE_LIMIT_CALLS = 10  # max API calls
 RATE_LIMIT_WINDOW = 1.0  # per second
 WIB = timezone(timedelta(hours=7))  # UTC+7 for Indonesian users
 _DISPLAY_TZ = WIB  # Module-level timezone for display (configurable via --timezone)
@@ -142,7 +145,6 @@ def parse_timezone(tz_str: str) -> timezone:
        return WIB
 def get_max_response_size(page_size: int = PAGE_SIZE) -> int:
    """
    Calculate max response size based on expected payload.
@@ -154,6 +156,37 @@ def get_max_response_size(page_size: int = PAGE_SIZE) -> int:
    return min(size, MAX_RESPONSE_SIZE_MAX)
 class RateLimiter:
    """Token bucket rate limiter for API calls. Thread-safe for use with ThreadPoolExecutor.

    The bucket holds at most ``calls`` tokens and refills continuously at
    ``calls / window`` tokens per second. Each ``acquire()`` consumes one
    token; when none is available the caller reserves the next one and
    sleeps until it has accrued.

    Attributes:
        calls: Bucket capacity (maximum burst size).
        window: Length in seconds of the period over which ``calls`` tokens accrue.
        tokens: Current balance. A negative value is debt: tokens already
            promised to callers that are still sleeping.
        last_update: ``time.monotonic()`` timestamp of the last refill.
    """

    def __init__(
        self, calls: int = RATE_LIMIT_CALLS, window: float = RATE_LIMIT_WINDOW
    ):
        """Create a limiter that starts with a full bucket.

        Args:
            calls: Maximum number of calls per ``window``; must be positive.
            window: Window length in seconds; must be positive.

        Raises:
            ValueError: If ``calls`` or ``window`` is not positive.
        """
        # Fail fast here instead of with a ZeroDivisionError (or a negative
        # sleep) on the first acquire().
        if calls <= 0 or window <= 0:
            raise ValueError("calls and window must be positive")
        self.calls = calls
        self.window = window
        self.tokens = float(calls)
        self.last_update = time.monotonic()
        self._lock = threading.Lock()

    def acquire(self) -> None:
        """Block until a token is available."""
        rate = self.calls / self.window  # tokens accrued per second
        with self._lock:
            now = time.monotonic()
            # Refill for the time elapsed since the last update, capped at capacity.
            self.tokens = min(
                self.calls, self.tokens + (now - self.last_update) * rate
            )
            self.last_update = now
            # Reserve a token immediately. A negative balance records how far
            # in the future this caller's token becomes available, so callers
            # arriving later queue up behind it.
            self.tokens -= 1
            wait_time = -self.tokens / rate if self.tokens < 0 else 0.0
        # Sleep outside the lock so other threads can make their own
        # reservation instead of blocking on the lock. Any sleep overshoot is
        # accounted for by the monotonic-clock refill on the next call.
        if wait_time > 0:
            time.sleep(wait_time)
 # Shared module-level limiter built with the default RATE_LIMIT_* settings;
 # fetch_page() calls acquire() on it before building each request.
 _rate_limiter = RateLimiter()
 GAME_CATEGORIES = {
    "All Esports": "Esports",
    "Counter Strike": "Counter Strike",
@@ -231,6 +264,7 @@ def fetch_page(
        if attempt > 0:
            time.sleep(delay)
        try:
            _rate_limiter.acquire()
            req = Request(url, headers={"User-Agent": "Mozilla/5.0"})
            with urlopen(req, timeout=10) as r:
                data = r.read()