Project Files

.claude

settings.local.json

src

bing

build-urls.ts

index.ts

parse-results.ts

search-images.ts

cache

image-search-results-payload.ts

index.ts

search-cache-key.ts

ttl-cache.ts

web-search-results-payload.ts

config

auto-sentinel.ts

config-defaults.ts

config-schematics.ts

resolve-config.ts

duckduckgo

build-urls.ts

index.ts

parse-results.ts

search-web.ts

web-search-result.ts

enrichment

enrich-search-results.ts

index.ts

metascraper-helpers.d.ts

metascraper.ts

errors

abort-error.ts

error-message.ts

index.ts

no-results-error.ts

tool-error.ts

unsupported-content-type-error.ts

index.ts

lmstudio-home.ts

markdown-path.ts

url-filename.ts

http

challenge.ts

decode.ts

fetch-error.ts

fetch-retry.ts

fetch.ts

impit-client.ts

impit-error.ts

index.ts

parse-content-type.ts

redirects.ts

response-body.ts

ssrf.ts

url-schema.ts

url.ts

images

download-image.ts

download-images.ts

index.ts

page

fetch-page.ts

fetched-page.ts

index.ts

page-kind.ts

parsers

image-extensions.ts

index.ts

page-images.ts

page-text.ts

parse-html.ts

pdf-text.ts

renderers

image-results.ts

index.ts

page-result.ts

retrieval

chunking.ts

excerpt.ts

index.ts

relevance.ts

selection.ts

index.ts

safe-search.ts

search-page-parameter.ts

text

escape-markdown.ts

html-to-markdown.ts

html-to-text.ts

index.ts

normalize-blank-lines.ts

normalize-text.ts

timing

index.ts

per-host-rate-limiter.ts

rate-limiter.ts

tools

fetch-images-tool.ts

image-search-tool.ts

visit-website-tool.ts

web-search-tool.ts

index.ts

tools-provider.ts

.gitignore

.prettierrc.json

CLAUDE.md

eslint.config.mjs

knip.json

LICENSE

manifest.json

package-lock.json

package.json

QWEN.md

README.md

thumbnail.png

tsconfig.json

tsdoc.json

src / timing / per-host-rate-limiter.ts

/**
 * Per-host rate limiter built on `Bottleneck.Group`. Each unique URL host gets its own
 * underlying Bottleneck limiter, so calls to different hosts run concurrently while calls
 * to the same host still observe the configured minimum interval. Idle per-host limiters
 * are automatically reaped by Bottleneck after their TTL elapses.
 */

import Bottleneck from "bottleneck"

/**
 * Settings accepted by the `PerHostRateLimiter` constructor.
 */
export interface PerHostRateLimiterOptions {
  /**
   * Smallest permitted spacing, in milliseconds, between two operations scheduled
   * against one and the same host.
   */
  minIntervalMs: number
  /**
   * Upper bound on how many operations may be in flight at once for any single host.
   *
   * @defaultValue `1`
   */
  maxConcurrentPerHost?: number
}

/**
 * Rate limiter that spaces out requests on a per-host basis. Requests aimed at the same
 * host are held apart by the configured minimum interval, whereas requests aimed at
 * different hosts do not wait on one another. When no host can be extracted from a URL,
 * the raw URL string (namespaced) serves as the limiter key, so repeated use of the same
 * unparseable URL is still serialised against itself instead of bypassing the limiter.
 */
export class PerHostRateLimiter {
  /** Bottleneck group that hands out one limiter per key, creating it on first use. */
  private readonly group: Bottleneck.Group

  /**
   * Build a limiter from the supplied interval and per-host concurrency settings.
   *
   * @param options - Limiter settings. When `maxConcurrentPerHost` is omitted it falls back to `1`, meaning operations against one host run one at a time; raise it only if the remote side copes with parallel requests.
   */
  public constructor(options: PerHostRateLimiterOptions) {
    const perHostSettings = {
      minTime: options.minIntervalMs,
      maxConcurrent: options.maxConcurrentPerHost ?? 1,
    }
    this.group = new Bottleneck.Group(perHostSettings)
  }

  /**
   * Block until the host named by `url` is allowed another outbound request. Internally an
   * empty task is queued on that host's limiter for the sole purpose of occupying one
   * interval slot; consequently the spacing applies between successive `wait()` resolutions
   * for a host (i.e. between request *starts*), not between request completions. Waits for
   * distinct hosts are independent of each other and can resolve concurrently.
   *
   * @param url - URL whose host selects which limiter to wait on.
   * @returns A promise that settles once the caller may issue its request.
   */
  public async wait(url: string): Promise<void> {
    const hostLimiter = this.group.key(hostKey(url))
    const consumeSlot = async (): Promise<void> => {
      /* intentionally empty: scheduling this task is what uses up one interval slot */
    }
    await hostLimiter.schedule(consumeSlot)
  }
}

/**
 * Compute the limiter key for a URL string. A parseable URL maps to its `host` component;
 * anything the `URL` constructor rejects maps to the raw input behind an `__unparseable__:`
 * prefix, which keeps malformed input from ever sharing a key with a genuine host name.
 *
 * @param url - URL string the key is computed from.
 * @returns A stable key that can be passed to `Bottleneck.Group.key`.
 */
function hostKey(url: string): string {
  let parsed: URL
  try {
    parsed = new URL(url)
  } catch {
    // The constructor threw, so the input is not a valid absolute URL: use the namespaced fallback.
    return `__unparseable__:${url}`
  }
  return parsed.host
}

web-tools