aisearch_model: Optional[Literal["@cf/meta/llama-3.3-70b-instruct-fp8-fast", "@cf/zai-org/glm-4.7-flash", "@cf/meta/llama-3.1-8b-instruct-fast", 27 more]]

One of the following:

"@cf/meta/llama-3.3-70b-instruct-fp8-fast"

"@cf/zai-org/glm-4.7-flash"

"@cf/meta/llama-3.1-8b-instruct-fast"

"@cf/meta/llama-3.1-8b-instruct-fp8"

"@cf/meta/llama-4-scout-17b-16e-instruct"

"@cf/qwen/qwen3-30b-a3b-fp8"

"@cf/deepseek-ai/deepseek-r1-distill-qwen-32b"

"@cf/moonshotai/kimi-k2-instruct"

"@cf/google/gemma-3-12b-it"

"@cf/google/gemma-4-26b-a4b-it"

"@cf/moonshotai/kimi-k2.5"

"anthropic/claude-3-7-sonnet"

"anthropic/claude-sonnet-4"

"anthropic/claude-opus-4"

"anthropic/claude-3-5-haiku"

"cerebras/qwen-3-235b-a22b-instruct"

"cerebras/qwen-3-235b-a22b-thinking"

"cerebras/llama-3.3-70b"

"cerebras/llama-4-maverick-17b-128e-instruct"

"cerebras/llama-4-scout-17b-16e-instruct"

"cerebras/gpt-oss-120b"

"google-ai-studio/gemini-2.5-flash"

"google-ai-studio/gemini-2.5-pro"

"grok/grok-4"

"groq/llama-3.3-70b-versatile"

"groq/llama-3.1-8b-instant"

"openai/gpt-5"

"openai/gpt-5-mini"

"openai/gpt-5-nano"

cache: Optional[bool]

cache_threshold: Optional[Literal["super_strict_match", "close_enough", "flexible_friend", "anything_goes"]]

One of the following:

"super_strict_match"

"close_enough"

"flexible_friend"

"anything_goes"

cache_ttl: Optional[Literal[600, 1800, 3600, 7 more]]

Cache entry TTL in seconds. Allowed values: 600 (10min), 1800 (30min), 3600 (1h), 7200 (2h), 21600 (6h), 43200 (12h), 86400 (24h), 172800 (48h), 259200 (72h), 518400 (6d).

One of the following:

600

1800

3600

7200

21600

43200

86400

172800

259200

518400

chunk_overlap: Optional[int]

maximum: 30

minimum: 0

chunk_size: Optional[int]

minimum: 64

created_by: Optional[str]

custom_metadata: Optional[List[CustomMetadata]]

data_type: Literal["text", "number", "boolean", "datetime"]

One of the following:

"text"

"number"

"boolean"

"datetime"

field_name: str

maxLength: 64

minLength: 1

embedding_model: Optional[Literal["@cf/qwen/qwen3-embedding-0.6b", "@cf/qwen/qwen3-vl-embedding-2b", "@cf/baai/bge-m3", 8 more]]

One of the following:

"@cf/qwen/qwen3-embedding-0.6b"

"@cf/qwen/qwen3-vl-embedding-2b"

"@cf/baai/bge-m3"

"@cf/baai/bge-large-en-v1.5"

"@cf/google/embeddinggemma-300m"

"google-ai-studio/gemini-embedding-001"

"google-ai-studio/gemini-embedding-2-preview"

"google-ai-studio/gemini-embedding-2"

"openai/text-embedding-3-small"

"openai/text-embedding-3-large"

enable: Optional[bool]

engine_version: Optional[float]

fusion_method: Optional[Literal["max", "rrf"]]

One of the following:

"max"

"rrf"

hybrid_search_enabled: Optional[bool] (deprecated)

Deprecated — use index_method instead.

index_method: Optional[IndexMethod]

Controls which storage backends are used during indexing. Defaults to vector-only.

keyword: bool

Enable keyword (BM25) storage backend.

vector: bool

Enable vector (embedding) storage backend.

indexing_options: Optional[IndexingOptions]

keyword_tokenizer: Optional[Literal["porter", "trigram"]]

Tokenizer used for keyword search indexing. porter provides word-level tokenization with Porter stemming (good for natural language queries). trigram enables character-level substring matching (good for partial matches, code, identifiers). Changing this triggers a full re-index. Defaults to porter.

One of the following:

"porter"

"trigram"

last_activity: Optional[datetime]

format: date-time

max_num_results: Optional[int]

maximum: 50

minimum: 1

metadata: Optional[Metadata]

created_from_aisearch_wizard: Optional[bool]

worker_domain: Optional[str]

modified_by: Optional[str]

namespace: Optional[str]

paused: Optional[bool]

public_endpoint_id: Optional[str]

public_endpoint_params: Optional[PublicEndpointParams]

authorized_hosts: Optional[List[str]]

chat_completions_endpoint: Optional[PublicEndpointParamsChatCompletionsEndpoint]

disabled: Optional[bool]

Disable chat completions endpoint for this public endpoint

custom_domains: Optional[List[str]]

Custom domain hostnames that alias this public endpoint. GET and create responses return the current set; on update (PUT) this field is only echoed back when supplied in the request body, otherwise it is null (omit it to leave domains unchanged).

enabled: Optional[bool]

mcp: Optional[PublicEndpointParamsMcp]

description: Optional[str]

disabled: Optional[bool]

Disable MCP endpoint for this public endpoint

rate_limit: Optional[PublicEndpointParamsRateLimit]

period_ms: Optional[int]

maximum: 3600000

minimum: 60000

requests: Optional[int]

minimum: 1

technique: Optional[Literal["fixed", "sliding"]]

One of the following:

"fixed"

"sliding"

search_endpoint: Optional[PublicEndpointParamsSearchEndpoint]

disabled: Optional[bool]

Disable search endpoint for this public endpoint

reranking: Optional[bool]

reranking_model: Optional[Literal["@cf/baai/bge-reranker-base", ""]]

One of the following:

"@cf/baai/bge-reranker-base"

""

retrieval_options: Optional[RetrievalOptions]

boost_by: Optional[List[RetrievalOptionsBoostBy]]

Metadata fields to boost search results by. Each entry specifies a metadata field and an optional direction. Direction defaults to ‘asc’ for numeric/datetime fields and ‘exists’ for text/boolean fields. Fields must match ‘timestamp’ or a defined custom_metadata field.

field: str

Metadata field name to boost by. Use ‘timestamp’ for document freshness, or any custom_metadata field. Numeric and datetime fields support all four directions (asc, desc, exists, not_exists); text/boolean fields only support exists/not_exists.

maxLength: 64

minLength: 1

direction: Optional[Literal["asc", "desc", "exists", "not_exists"]]

Boost direction. ‘desc’ = higher values rank higher (e.g. newer timestamps). ‘asc’ = lower values rank higher. ‘exists’ = boost chunks that have the field. ‘not_exists’ = boost chunks that lack the field. Optional — defaults to ‘asc’ for numeric/datetime fields, ‘exists’ for text/boolean fields.

One of the following:

"asc"

"desc"

"exists"

"not_exists"

keyword_match_mode: Optional[Literal["and", "or"]]

Controls which documents are candidates for BM25 scoring. ‘and’ restricts candidates to documents containing all query terms; ‘or’ includes any document containing at least one term, ranked by BM25 relevance. Defaults to ‘and’.

One of the following:

"and"

"or"

rewrite_model: Optional[Literal["@cf/meta/llama-3.3-70b-instruct-fp8-fast", "@cf/zai-org/glm-4.7-flash", "@cf/meta/llama-3.1-8b-instruct-fast", 27 more]]

One of the following:

"@cf/meta/llama-3.3-70b-instruct-fp8-fast"

"@cf/zai-org/glm-4.7-flash"

"@cf/meta/llama-3.1-8b-instruct-fast"

"@cf/meta/llama-3.1-8b-instruct-fp8"

"@cf/meta/llama-4-scout-17b-16e-instruct"

"@cf/qwen/qwen3-30b-a3b-fp8"

"@cf/deepseek-ai/deepseek-r1-distill-qwen-32b"

"@cf/moonshotai/kimi-k2-instruct"

"@cf/google/gemma-3-12b-it"

"@cf/google/gemma-4-26b-a4b-it"

"@cf/moonshotai/kimi-k2.5"

"anthropic/claude-3-7-sonnet"

"anthropic/claude-sonnet-4"

"anthropic/claude-opus-4"

"anthropic/claude-3-5-haiku"

"cerebras/qwen-3-235b-a22b-instruct"

"cerebras/qwen-3-235b-a22b-thinking"

"cerebras/llama-3.3-70b"

"cerebras/llama-4-maverick-17b-128e-instruct"

"cerebras/llama-4-scout-17b-16e-instruct"

"cerebras/gpt-oss-120b"

"google-ai-studio/gemini-2.5-flash"

"google-ai-studio/gemini-2.5-pro"

"grok/grok-4"

"groq/llama-3.3-70b-versatile"

"groq/llama-3.1-8b-instant"

"openai/gpt-5"

"openai/gpt-5-mini"

"openai/gpt-5-nano"

rewrite_query: Optional[bool]

score_threshold: Optional[float]

maximum: 1

minimum: 0

source: Optional[str]

source_params: Optional[SourceParams]

exclude_items: Optional[List[str]]

List of path patterns to exclude. Uses micromatch glob syntax: * matches within a path segment, ** matches across path segments (e.g., /admin/** matches /admin/users and /admin/settings/advanced)

include_items: Optional[List[str]]

List of path patterns to include. Uses micromatch glob syntax: * matches within a path segment, ** matches across path segments (e.g., /blog/** matches /blog/post and /blog/2024/post)

prefix: Optional[str]

r2_jurisdiction: Optional[str]

web_crawler: Optional[SourceParamsWebCrawler]

parse_options: Optional[SourceParamsWebCrawlerParseOptions]

content_selector: Optional[List[SourceParamsWebCrawlerParseOptionsContentSelector]]

List of path-to-selector mappings for extracting specific content from crawled pages. Each entry pairs a URL glob pattern with a CSS selector. The first matching path wins. Only the matched HTML fragment is stored and indexed. Omit the field to disable content selection — empty arrays are rejected.

path: str

Glob pattern to match against the page URL path. Uses standard glob syntax: * matches within a segment, ** crosses directories.

maxLength: 200

minLength: 1

selector: str

CSS selector to extract content from pages matching the path pattern. Must not contain disallowed characters (;, `, $, {, }, \). Must target a single element; if multiple elements match, the selector is ignored and the full page is used.

maxLength: 200

minLength: 1

include_headers: Optional[Dict[str, str]]

Up to 5 custom HTTP headers sent with each crawl request. Names must be RFC-7230 token characters (no spaces, colons, or control characters); values must be HTAB + printable ASCII (no CR/LF).

include_images: Optional[bool]

specific_sitemaps: Optional[List[str]]

List of specific sitemap URLs to use for crawling. Only valid when parse_type is ‘sitemap’.

use_browser_rendering: Optional[bool]

parse_type: Optional[Literal["sitemap", "crawl"]]

One of the following:

"sitemap"

"crawl"

status: Optional[str]

sync_interval: Optional[Literal[900, 1800, 3600, 5 more]]

Interval between automatic syncs, in seconds. Allowed values: 900 (15min), 1800 (30min), 3600 (1h), 7200 (2h), 14400 (4h), 21600 (6h), 43200 (12h), 86400 (24h).

One of the following:

900

1800

3600

7200

14400

21600

43200

86400

token_id: Optional[str]

format: uuid

type: Optional[Literal["r2", "web-crawler"]]

One of the following:

"r2"

"web-crawler"

class InstanceCreateResponse: …

id: str

AI Search instance ID. Lowercase alphanumeric, hyphens, and underscores.

maxLength: 64

minLength: 1

created_at: datetime

format: date-time

modified_at: datetime

format: date-time

ai_gateway_id: Optional[str]

aisearch_model: Optional[Literal["@cf/meta/llama-3.3-70b-instruct-fp8-fast", "@cf/zai-org/glm-4.7-flash", "@cf/meta/llama-3.1-8b-instruct-fast", 27 more]]

One of the following:

"@cf/meta/llama-3.3-70b-instruct-fp8-fast"

"@cf/zai-org/glm-4.7-flash"

"@cf/meta/llama-3.1-8b-instruct-fast"

"@cf/meta/llama-3.1-8b-instruct-fp8"

"@cf/meta/llama-4-scout-17b-16e-instruct"

"@cf/qwen/qwen3-30b-a3b-fp8"

"@cf/deepseek-ai/deepseek-r1-distill-qwen-32b"

"@cf/moonshotai/kimi-k2-instruct"

"@cf/google/gemma-3-12b-it"

"@cf/google/gemma-4-26b-a4b-it"

"@cf/moonshotai/kimi-k2.5"

"anthropic/claude-3-7-sonnet"

"anthropic/claude-sonnet-4"

"anthropic/claude-opus-4"

"anthropic/claude-3-5-haiku"

"cerebras/qwen-3-235b-a22b-instruct"

"cerebras/qwen-3-235b-a22b-thinking"

"cerebras/llama-3.3-70b"

"cerebras/llama-4-maverick-17b-128e-instruct"

"cerebras/llama-4-scout-17b-16e-instruct"

"cerebras/gpt-oss-120b"

"google-ai-studio/gemini-2.5-flash"

"google-ai-studio/gemini-2.5-pro"

"grok/grok-4"

"groq/llama-3.3-70b-versatile"

"groq/llama-3.1-8b-instant"

"openai/gpt-5"

"openai/gpt-5-mini"

"openai/gpt-5-nano"

cache: Optional[bool]

cache_threshold: Optional[Literal["super_strict_match", "close_enough", "flexible_friend", "anything_goes"]]

One of the following:

"super_strict_match"

"close_enough"

"flexible_friend"

"anything_goes"

cache_ttl: Optional[Literal[600, 1800, 3600, 7 more]]

Cache entry TTL in seconds. Allowed values: 600 (10min), 1800 (30min), 3600 (1h), 7200 (2h), 21600 (6h), 43200 (12h), 86400 (24h), 172800 (48h), 259200 (72h), 518400 (6d).

One of the following:

600

1800

3600

7200

21600

43200

86400

172800

259200

518400

chunk_overlap: Optional[int]

maximum: 30

minimum: 0

chunk_size: Optional[int]

minimum: 64

created_by: Optional[str]

custom_metadata: Optional[List[CustomMetadata]]

data_type: Literal["text", "number", "boolean", "datetime"]

One of the following:

"text"

"number"

"boolean"

"datetime"

field_name: str

maxLength: 64

minLength: 1

embedding_model: Optional[Literal["@cf/qwen/qwen3-embedding-0.6b", "@cf/qwen/qwen3-vl-embedding-2b", "@cf/baai/bge-m3", 8 more]]

One of the following:

"@cf/qwen/qwen3-embedding-0.6b"

"@cf/qwen/qwen3-vl-embedding-2b"

"@cf/baai/bge-m3"

"@cf/baai/bge-large-en-v1.5"

"@cf/google/embeddinggemma-300m"

"google-ai-studio/gemini-embedding-001"

"google-ai-studio/gemini-embedding-2-preview"

"google-ai-studio/gemini-embedding-2"

"openai/text-embedding-3-small"

"openai/text-embedding-3-large"

enable: Optional[bool]

engine_version: Optional[float]

fusion_method: Optional[Literal["max", "rrf"]]

One of the following:

"max"

"rrf"

hybrid_search_enabled: Optional[bool] (deprecated)

Deprecated — use index_method instead.

index_method: Optional[IndexMethod]

Controls which storage backends are used during indexing. Defaults to vector-only.

keyword: bool

Enable keyword (BM25) storage backend.

vector: bool

Enable vector (embedding) storage backend.

indexing_options: Optional[IndexingOptions]

keyword_tokenizer: Optional[Literal["porter", "trigram"]]

One of the following:

"porter"

"trigram"

last_activity: Optional[datetime]

format: date-time

max_num_results: Optional[int]

maximum: 50

minimum: 1

metadata: Optional[Metadata]

created_from_aisearch_wizard: Optional[bool]

worker_domain: Optional[str]

modified_by: Optional[str]

namespace: Optional[str]

paused: Optional[bool]

public_endpoint_id: Optional[str]

public_endpoint_params: Optional[PublicEndpointParams]

authorized_hosts: Optional[List[str]]

chat_completions_endpoint: Optional[PublicEndpointParamsChatCompletionsEndpoint]

disabled: Optional[bool]

Disable chat completions endpoint for this public endpoint

custom_domains: Optional[List[str]]

enabled: Optional[bool]

mcp: Optional[PublicEndpointParamsMcp]

description: Optional[str]

disabled: Optional[bool]

Disable MCP endpoint for this public endpoint

rate_limit: Optional[PublicEndpointParamsRateLimit]

period_ms: Optional[int]

maximum: 3600000

minimum: 60000

requests: Optional[int]

minimum: 1

technique: Optional[Literal["fixed", "sliding"]]

One of the following:

"fixed"

"sliding"

search_endpoint: Optional[PublicEndpointParamsSearchEndpoint]

disabled: Optional[bool]

Disable search endpoint for this public endpoint

reranking: Optional[bool]

reranking_model: Optional[Literal["@cf/baai/bge-reranker-base", ""]]

One of the following:

"@cf/baai/bge-reranker-base"

""

retrieval_options: Optional[RetrievalOptions]

boost_by: Optional[List[RetrievalOptionsBoostBy]]

field: str

maxLength: 64

minLength: 1

direction: Optional[Literal["asc", "desc", "exists", "not_exists"]]

One of the following:

"asc"

"desc"

"exists"

"not_exists"

keyword_match_mode: Optional[Literal["and", "or"]]

One of the following:

"and"

"or"

rewrite_model: Optional[Literal["@cf/meta/llama-3.3-70b-instruct-fp8-fast", "@cf/zai-org/glm-4.7-flash", "@cf/meta/llama-3.1-8b-instruct-fast", 27 more]]

One of the following:

"@cf/meta/llama-3.3-70b-instruct-fp8-fast"

"@cf/zai-org/glm-4.7-flash"

"@cf/meta/llama-3.1-8b-instruct-fast"

"@cf/meta/llama-3.1-8b-instruct-fp8"

"@cf/meta/llama-4-scout-17b-16e-instruct"

"@cf/qwen/qwen3-30b-a3b-fp8"

"@cf/deepseek-ai/deepseek-r1-distill-qwen-32b"

"@cf/moonshotai/kimi-k2-instruct"

"@cf/google/gemma-3-12b-it"

"@cf/google/gemma-4-26b-a4b-it"

"@cf/moonshotai/kimi-k2.5"

"anthropic/claude-3-7-sonnet"

"anthropic/claude-sonnet-4"

"anthropic/claude-opus-4"

"anthropic/claude-3-5-haiku"

"cerebras/qwen-3-235b-a22b-instruct"

"cerebras/qwen-3-235b-a22b-thinking"

"cerebras/llama-3.3-70b"

"cerebras/llama-4-maverick-17b-128e-instruct"

"cerebras/llama-4-scout-17b-16e-instruct"

"cerebras/gpt-oss-120b"

"google-ai-studio/gemini-2.5-flash"

"google-ai-studio/gemini-2.5-pro"

"grok/grok-4"

"groq/llama-3.3-70b-versatile"

"groq/llama-3.1-8b-instant"

"openai/gpt-5"

"openai/gpt-5-mini"

"openai/gpt-5-nano"

rewrite_query: Optional[bool]

score_threshold: Optional[float]

maximum: 1

minimum: 0

source: Optional[str]

source_params: Optional[SourceParams]

exclude_items: Optional[List[str]]

List of path patterns to exclude. Uses micromatch glob syntax: * matches within a path segment, ** matches across path segments (e.g., /admin/** matches /admin/users and /admin/settings/advanced)

include_items: Optional[List[str]]

List of path patterns to include. Uses micromatch glob syntax: * matches within a path segment, ** matches across path segments (e.g., /blog/** matches /blog/post and /blog/2024/post)

prefix: Optional[str]

r2_jurisdiction: Optional[str]

web_crawler: Optional[SourceParamsWebCrawler]

parse_options: Optional[SourceParamsWebCrawlerParseOptions]

content_selector: Optional[List[SourceParamsWebCrawlerParseOptionsContentSelector]]

path: str

Glob pattern to match against the page URL path. Uses standard glob syntax: * matches within a segment, ** crosses directories.

maxLength: 200

minLength: 1

selector: str

maxLength: 200

minLength: 1

include_headers: Optional[Dict[str, str]]

Up to 5 custom HTTP headers sent with each crawl request. Names must be RFC-7230 token characters (no spaces, colons, or control characters); values must be HTAB + printable ASCII (no CR/LF).

include_images: Optional[bool]

specific_sitemaps: Optional[List[str]]

List of specific sitemap URLs to use for crawling. Only valid when parse_type is ‘sitemap’.

use_browser_rendering: Optional[bool]

parse_type: Optional[Literal["sitemap", "crawl"]]

One of the following:

"sitemap"

"crawl"

status: Optional[str]

sync_interval: Optional[Literal[900, 1800, 3600, 5 more]]

Interval between automatic syncs, in seconds. Allowed values: 900 (15min), 1800 (30min), 3600 (1h), 7200 (2h), 14400 (4h), 21600 (6h), 43200 (12h), 86400 (24h).

One of the following:

900

1800

3600

7200

14400

21600

43200

86400

token_id: Optional[str]

format: uuid

type: Optional[Literal["r2", "web-crawler"]]

One of the following:

"r2"

"web-crawler"

class InstanceReadResponse: …

id: str

AI Search instance ID. Lowercase alphanumeric, hyphens, and underscores.

maxLength: 64

minLength: 1

created_at: datetime

format: date-time

modified_at: datetime

format: date-time

ai_gateway_id: Optional[str]

aisearch_model: Optional[Literal["@cf/meta/llama-3.3-70b-instruct-fp8-fast", "@cf/zai-org/glm-4.7-flash", "@cf/meta/llama-3.1-8b-instruct-fast", 27 more]]

One of the following:

"@cf/meta/llama-3.3-70b-instruct-fp8-fast"

"@cf/zai-org/glm-4.7-flash"

"@cf/meta/llama-3.1-8b-instruct-fast"

"@cf/meta/llama-3.1-8b-instruct-fp8"

"@cf/meta/llama-4-scout-17b-16e-instruct"

"@cf/qwen/qwen3-30b-a3b-fp8"

"@cf/deepseek-ai/deepseek-r1-distill-qwen-32b"

"@cf/moonshotai/kimi-k2-instruct"

"@cf/google/gemma-3-12b-it"

"@cf/google/gemma-4-26b-a4b-it"

"@cf/moonshotai/kimi-k2.5"

"anthropic/claude-3-7-sonnet"

"anthropic/claude-sonnet-4"

"anthropic/claude-opus-4"

"anthropic/claude-3-5-haiku"

"cerebras/qwen-3-235b-a22b-instruct"

"cerebras/qwen-3-235b-a22b-thinking"

"cerebras/llama-3.3-70b"

"cerebras/llama-4-maverick-17b-128e-instruct"

"cerebras/llama-4-scout-17b-16e-instruct"

"cerebras/gpt-oss-120b"

"google-ai-studio/gemini-2.5-flash"

"google-ai-studio/gemini-2.5-pro"

"grok/grok-4"

"groq/llama-3.3-70b-versatile"

"groq/llama-3.1-8b-instant"

"openai/gpt-5"

"openai/gpt-5-mini"

"openai/gpt-5-nano"

cache: Optional[bool]

cache_threshold: Optional[Literal["super_strict_match", "close_enough", "flexible_friend", "anything_goes"]]

One of the following:

"super_strict_match"

"close_enough"

"flexible_friend"

"anything_goes"

cache_ttl: Optional[Literal[600, 1800, 3600, 7 more]]

Cache entry TTL in seconds. Allowed values: 600 (10min), 1800 (30min), 3600 (1h), 7200 (2h), 21600 (6h), 43200 (12h), 86400 (24h), 172800 (48h), 259200 (72h), 518400 (6d).

One of the following:

600

1800

3600

7200

21600

43200

86400

172800

259200

518400

chunk_overlap: Optional[int]

maximum: 30

minimum: 0

chunk_size: Optional[int]

minimum: 64

created_by: Optional[str]

custom_metadata: Optional[List[CustomMetadata]]

data_type: Literal["text", "number", "boolean", "datetime"]

One of the following:

"text"

"number"

"boolean"

"datetime"

field_name: str

maxLength: 64

minLength: 1

embedding_model: Optional[Literal["@cf/qwen/qwen3-embedding-0.6b", "@cf/qwen/qwen3-vl-embedding-2b", "@cf/baai/bge-m3", 8 more]]

One of the following:

"@cf/qwen/qwen3-embedding-0.6b"

"@cf/qwen/qwen3-vl-embedding-2b"

"@cf/baai/bge-m3"

"@cf/baai/bge-large-en-v1.5"

"@cf/google/embeddinggemma-300m"

"google-ai-studio/gemini-embedding-001"

"google-ai-studio/gemini-embedding-2-preview"

"google-ai-studio/gemini-embedding-2"

"openai/text-embedding-3-small"

"openai/text-embedding-3-large"

enable: Optional[bool]

engine_version: Optional[float]

fusion_method: Optional[Literal["max", "rrf"]]

One of the following:

"max"

"rrf"

hybrid_search_enabled: Optional[bool] (deprecated)

Deprecated — use index_method instead.

index_method: Optional[IndexMethod]

Controls which storage backends are used during indexing. Defaults to vector-only.

keyword: bool

Enable keyword (BM25) storage backend.

vector: bool

Enable vector (embedding) storage backend.

indexing_options: Optional[IndexingOptions]

keyword_tokenizer: Optional[Literal["porter", "trigram"]]

One of the following:

"porter"

"trigram"

last_activity: Optional[datetime]

format: date-time

max_num_results: Optional[int]

maximum: 50

minimum: 1

metadata: Optional[Metadata]

created_from_aisearch_wizard: Optional[bool]

worker_domain: Optional[str]

modified_by: Optional[str]

namespace: Optional[str]

paused: Optional[bool]

public_endpoint_id: Optional[str]

public_endpoint_params: Optional[PublicEndpointParams]

authorized_hosts: Optional[List[str]]

chat_completions_endpoint: Optional[PublicEndpointParamsChatCompletionsEndpoint]

disabled: Optional[bool]

Disable chat completions endpoint for this public endpoint

custom_domains: Optional[List[str]]

enabled: Optional[bool]

mcp: Optional[PublicEndpointParamsMcp]

description: Optional[str]

disabled: Optional[bool]

Disable MCP endpoint for this public endpoint

rate_limit: Optional[PublicEndpointParamsRateLimit]

period_ms: Optional[int]

maximum: 3600000

minimum: 60000

requests: Optional[int]

minimum: 1

technique: Optional[Literal["fixed", "sliding"]]

One of the following:

"fixed"

"sliding"

search_endpoint: Optional[PublicEndpointParamsSearchEndpoint]

disabled: Optional[bool]

Disable search endpoint for this public endpoint

reranking: Optional[bool]

reranking_model: Optional[Literal["@cf/baai/bge-reranker-base", ""]]

One of the following:

"@cf/baai/bge-reranker-base"

""

retrieval_options: Optional[RetrievalOptions]

boost_by: Optional[List[RetrievalOptionsBoostBy]]

field: str

maxLength: 64

minLength: 1

direction: Optional[Literal["asc", "desc", "exists", "not_exists"]]

One of the following:

"asc"

"desc"

"exists"

"not_exists"

keyword_match_mode: Optional[Literal["and", "or"]]

One of the following:

"and"

"or"

rewrite_model: Optional[Literal["@cf/meta/llama-3.3-70b-instruct-fp8-fast", "@cf/zai-org/glm-4.7-flash", "@cf/meta/llama-3.1-8b-instruct-fast", 27 more]]

One of the following:

"@cf/meta/llama-3.3-70b-instruct-fp8-fast"

"@cf/zai-org/glm-4.7-flash"

"@cf/meta/llama-3.1-8b-instruct-fast"

"@cf/meta/llama-3.1-8b-instruct-fp8"

"@cf/meta/llama-4-scout-17b-16e-instruct"

"@cf/qwen/qwen3-30b-a3b-fp8"

"@cf/deepseek-ai/deepseek-r1-distill-qwen-32b"

"@cf/moonshotai/kimi-k2-instruct"

"@cf/google/gemma-3-12b-it"

"@cf/google/gemma-4-26b-a4b-it"

"@cf/moonshotai/kimi-k2.5"

"anthropic/claude-3-7-sonnet"

"anthropic/claude-sonnet-4"

"anthropic/claude-opus-4"

"anthropic/claude-3-5-haiku"

"cerebras/qwen-3-235b-a22b-instruct"

"cerebras/qwen-3-235b-a22b-thinking"

"cerebras/llama-3.3-70b"

"cerebras/llama-4-maverick-17b-128e-instruct"

"cerebras/llama-4-scout-17b-16e-instruct"

"cerebras/gpt-oss-120b"

"google-ai-studio/gemini-2.5-flash"

"google-ai-studio/gemini-2.5-pro"

"grok/grok-4"

"groq/llama-3.3-70b-versatile"

"groq/llama-3.1-8b-instant"

"openai/gpt-5"

"openai/gpt-5-mini"

"openai/gpt-5-nano"

rewrite_query: Optional[bool]

score_threshold: Optional[float]

maximum: 1

minimum: 0

source: Optional[str]

source_params: Optional[SourceParams]

exclude_items: Optional[List[str]]

List of path patterns to exclude. Uses micromatch glob syntax: * matches within a path segment, ** matches across path segments (e.g., /admin/** matches /admin/users and /admin/settings/advanced)

include_items: Optional[List[str]]

List of path patterns to include. Uses micromatch glob syntax: * matches within a path segment, ** matches across path segments (e.g., /blog/** matches /blog/post and /blog/2024/post)

prefix: Optional[str]

r2_jurisdiction: Optional[str]

web_crawler: Optional[SourceParamsWebCrawler]

parse_options: Optional[SourceParamsWebCrawlerParseOptions]

content_selector: Optional[List[SourceParamsWebCrawlerParseOptionsContentSelector]]

path: str

Glob pattern to match against the page URL path. Uses standard glob syntax: * matches within a segment, ** crosses directories.

maxLength: 200

minLength: 1

selector: str

maxLength: 200

minLength: 1

include_headers: Optional[Dict[str, str]]

Up to 5 custom HTTP headers sent with each crawl request. Names must be RFC-7230 token characters (no spaces, colons, or control characters); values must be HTAB + printable ASCII (no CR/LF).

include_images: Optional[bool]

specific_sitemaps: Optional[List[str]]

List of specific sitemap URLs to use for crawling. Only valid when parse_type is ‘sitemap’.

use_browser_rendering: Optional[bool]

parse_type: Optional[Literal["sitemap", "crawl"]]

One of the following:

"sitemap"

"crawl"

status: Optional[str]

sync_interval: Optional[Literal[900, 1800, 3600, 5 more]]

Interval between automatic syncs, in seconds. Allowed values: 900 (15min), 1800 (30min), 3600 (1h), 7200 (2h), 14400 (4h), 21600 (6h), 43200 (12h), 86400 (24h).

One of the following:

900

1800

3600

7200

14400

21600

43200

86400

token_id: Optional[str]

format: uuid

type: Optional[Literal["r2", "web-crawler"]]

One of the following:

"r2"

"web-crawler"

class InstanceUpdateResponse: …

id: str

AI Search instance ID. Lowercase alphanumeric, hyphens, and underscores.

maxLength: 64

minLength: 1

created_at: datetime

format: date-time

modified_at: datetime

format: date-time

ai_gateway_id: Optional[str]

aisearch_model: Optional[Literal["@cf/meta/llama-3.3-70b-instruct-fp8-fast", "@cf/zai-org/glm-4.7-flash", "@cf/meta/llama-3.1-8b-instruct-fast", 27 more]]

One of the following:

"@cf/meta/llama-3.3-70b-instruct-fp8-fast"

"@cf/zai-org/glm-4.7-flash"

"@cf/meta/llama-3.1-8b-instruct-fast"

"@cf/meta/llama-3.1-8b-instruct-fp8"

"@cf/meta/llama-4-scout-17b-16e-instruct"

"@cf/qwen/qwen3-30b-a3b-fp8"

"@cf/deepseek-ai/deepseek-r1-distill-qwen-32b"

"@cf/moonshotai/kimi-k2-instruct"

"@cf/google/gemma-3-12b-it"

"@cf/google/gemma-4-26b-a4b-it"

"@cf/moonshotai/kimi-k2.5"

"anthropic/claude-3-7-sonnet"

"anthropic/claude-sonnet-4"

"anthropic/claude-opus-4"

"anthropic/claude-3-5-haiku"

"cerebras/qwen-3-235b-a22b-instruct"

"cerebras/qwen-3-235b-a22b-thinking"

"cerebras/llama-3.3-70b"

"cerebras/llama-4-maverick-17b-128e-instruct"

"cerebras/llama-4-scout-17b-16e-instruct"

"cerebras/gpt-oss-120b"

"google-ai-studio/gemini-2.5-flash"

"google-ai-studio/gemini-2.5-pro"

"grok/grok-4"

"groq/llama-3.3-70b-versatile"

"groq/llama-3.1-8b-instant"

"openai/gpt-5"

"openai/gpt-5-mini"

"openai/gpt-5-nano"

cache: Optional[bool]

cache_threshold: Optional[Literal["super_strict_match", "close_enough", "flexible_friend", "anything_goes"]]

One of the following:

"super_strict_match"

"close_enough"

"flexible_friend"

"anything_goes"

cache_ttl: Optional[Literal[600, 1800, 3600, 7 more]]

Cache entry TTL in seconds. Allowed values: 600 (10min), 1800 (30min), 3600 (1h), 7200 (2h), 21600 (6h), 43200 (12h), 86400 (24h), 172800 (48h), 259200 (72h), 518400 (6d).

One of the following:

600

1800

3600

7200

21600

43200

86400

172800

259200

518400

chunk_overlap: Optional[int]

maximum: 30

minimum: 0

chunk_size: Optional[int]

minimum: 64

created_by: Optional[str]

custom_metadata: Optional[List[CustomMetadata]]

data_type: Literal["text", "number", "boolean", "datetime"]

One of the following:

"text"

"number"

"boolean"

"datetime"

field_name: str

maxLength: 64

minLength: 1

embedding_model: Optional[Literal["@cf/qwen/qwen3-embedding-0.6b", "@cf/qwen/qwen3-vl-embedding-2b", "@cf/baai/bge-m3", 8 more]]

One of the following:

"@cf/qwen/qwen3-embedding-0.6b"

"@cf/qwen/qwen3-vl-embedding-2b"

"@cf/baai/bge-m3"

"@cf/baai/bge-large-en-v1.5"

"@cf/google/embeddinggemma-300m"

"google-ai-studio/gemini-embedding-001"

"google-ai-studio/gemini-embedding-2-preview"

"google-ai-studio/gemini-embedding-2"

"openai/text-embedding-3-small"

"openai/text-embedding-3-large"

enable: Optional[bool]

engine_version: Optional[float]

fusion_method: Optional[Literal["max", "rrf"]]

One of the following:

"max"

"rrf"

hybrid_search_enabled: Optional[bool] (deprecated)

Deprecated — use index_method instead.

index_method: Optional[IndexMethod]

Controls which storage backends are used during indexing. Defaults to vector-only.

keyword: bool

Enable keyword (BM25) storage backend.

vector: bool

Enable vector (embedding) storage backend.

indexing_options: Optional[IndexingOptions]

keyword_tokenizer: Optional[Literal["porter", "trigram"]]

One of the following:

"porter"

"trigram"

last_activity: Optional[datetime]

format: date-time

max_num_results: Optional[int]

maximum: 50

minimum: 1

metadata: Optional[Metadata]

created_from_aisearch_wizard: Optional[bool]

worker_domain: Optional[str]

modified_by: Optional[str]

namespace: Optional[str]

paused: Optional[bool]

public_endpoint_id: Optional[str]

public_endpoint_params: Optional[PublicEndpointParams]

authorized_hosts: Optional[List[str]]

chat_completions_endpoint: Optional[PublicEndpointParamsChatCompletionsEndpoint]

disabled: Optional[bool]

Disable chat completions endpoint for this public endpoint

custom_domains: Optional[List[str]]

enabled: Optional[bool]

mcp: Optional[PublicEndpointParamsMcp]

description: Optional[str]

disabled: Optional[bool]

Disable MCP endpoint for this public endpoint

rate_limit: Optional[PublicEndpointParamsRateLimit]

period_ms: Optional[int]

maximum: 3600000

minimum: 60000

requests: Optional[int]

minimum: 1

technique: Optional[Literal["fixed", "sliding"]]

One of the following:

"fixed"

"sliding"

search_endpoint: Optional[PublicEndpointParamsSearchEndpoint]

disabled: Optional[bool]

Disable search endpoint for this public endpoint

reranking: Optional[bool]

reranking_model: Optional[Literal["@cf/baai/bge-reranker-base", ""]]

One of the following:

"@cf/baai/bge-reranker-base"

""

retrieval_options: Optional[RetrievalOptions]

boost_by: Optional[List[RetrievalOptionsBoostBy]]

field: str

maxLength: 64

minLength: 1

direction: Optional[Literal["asc", "desc", "exists", "not_exists"]]

One of the following:

"asc"

"desc"

"exists"

"not_exists"

keyword_match_mode: Optional[Literal["and", "or"]]

One of the following:

"and"

"or"

rewrite_model: Optional[Literal["@cf/meta/llama-3.3-70b-instruct-fp8-fast", "@cf/zai-org/glm-4.7-flash", "@cf/meta/llama-3.1-8b-instruct-fast", 27 more]]

One of the following:

"@cf/meta/llama-3.3-70b-instruct-fp8-fast"

"@cf/zai-org/glm-4.7-flash"

"@cf/meta/llama-3.1-8b-instruct-fast"

"@cf/meta/llama-3.1-8b-instruct-fp8"

"@cf/meta/llama-4-scout-17b-16e-instruct"

"@cf/qwen/qwen3-30b-a3b-fp8"

"@cf/deepseek-ai/deepseek-r1-distill-qwen-32b"

"@cf/moonshotai/kimi-k2-instruct"

"@cf/google/gemma-3-12b-it"

"@cf/google/gemma-4-26b-a4b-it"

"@cf/moonshotai/kimi-k2.5"

"anthropic/claude-3-7-sonnet"

"anthropic/claude-sonnet-4"

"anthropic/claude-opus-4"

"anthropic/claude-3-5-haiku"

"cerebras/qwen-3-235b-a22b-instruct"

"cerebras/qwen-3-235b-a22b-thinking"

"cerebras/llama-3.3-70b"

"cerebras/llama-4-maverick-17b-128e-instruct"

"cerebras/llama-4-scout-17b-16e-instruct"

"cerebras/gpt-oss-120b"

"google-ai-studio/gemini-2.5-flash"

"google-ai-studio/gemini-2.5-pro"

"grok/grok-4"

"groq/llama-3.3-70b-versatile"

"groq/llama-3.1-8b-instant"

"openai/gpt-5"

"openai/gpt-5-mini"

"openai/gpt-5-nano"

rewrite_query: Optional[bool]

score_threshold: Optional[float]

maximum: 1

minimum: 0

source: Optional[str]

source_params: Optional[SourceParams]

exclude_items: Optional[List[str]]

List of path patterns to exclude. Uses micromatch glob syntax: * matches within a path segment, ** matches across path segments (e.g., /admin/** matches /admin/users and /admin/settings/advanced)

include_items: Optional[List[str]]

List of path patterns to include. Uses micromatch glob syntax: * matches within a path segment, ** matches across path segments (e.g., /blog/** matches /blog/post and /blog/2024/post)

prefix: Optional[str]

r2_jurisdiction: Optional[str]

web_crawler: Optional[SourceParamsWebCrawler]

parse_options: Optional[SourceParamsWebCrawlerParseOptions]

content_selector: Optional[List[SourceParamsWebCrawlerParseOptionsContentSelector]]

path: str

Glob pattern to match against the page URL path. Uses standard glob syntax: * matches within a segment, ** crosses directories.

maxLength: 200

minLength: 1

selector: str

maxLength: 200

minLength: 1

include_headers: Optional[Dict[str, str]]

Up to 5 custom HTTP headers sent with each crawl request. Names must be RFC-7230 token characters (no spaces, colons, or control characters); values must be HTAB + printable ASCII (no CR/LF).

include_images: Optional[bool]

specific_sitemaps: Optional[List[str]]

List of specific sitemap URLs to use for crawling. Only valid when parse_type is ‘sitemap’.

use_browser_rendering: Optional[bool]

parse_type: Optional[Literal["sitemap", "crawl"]]

One of the following:

"sitemap"

"crawl"

status: Optional[str]

sync_interval: Optional[Literal[900, 1800, 3600, 5 more]]

Interval between automatic syncs, in seconds. Allowed values: 900 (15min), 1800 (30min), 3600 (1h), 7200 (2h), 14400 (4h), 21600 (6h), 43200 (12h), 86400 (24h).

One of the following:

900

1800

3600

7200

14400

21600

43200

86400

token_id: Optional[str]

format: uuid

type: Optional[Literal["r2", "web-crawler"]]

One of the following:

"r2"

"web-crawler"

class InstanceDeleteResponse: …

id: str

AI Search instance ID. Lowercase alphanumeric, hyphens, and underscores.

maxLength: 64

minLength: 1

created_at: datetime

format: date-time

modified_at: datetime

format: date-time

ai_gateway_id: Optional[str]

aisearch_model: Optional[Literal["@cf/meta/llama-3.3-70b-instruct-fp8-fast", "@cf/zai-org/glm-4.7-flash", "@cf/meta/llama-3.1-8b-instruct-fast", 27 more]]

One of the following:

"@cf/meta/llama-3.3-70b-instruct-fp8-fast"

"@cf/zai-org/glm-4.7-flash"

"@cf/meta/llama-3.1-8b-instruct-fast"

"@cf/meta/llama-3.1-8b-instruct-fp8"

"@cf/meta/llama-4-scout-17b-16e-instruct"

"@cf/qwen/qwen3-30b-a3b-fp8"

"@cf/deepseek-ai/deepseek-r1-distill-qwen-32b"

"@cf/moonshotai/kimi-k2-instruct"

"@cf/google/gemma-3-12b-it"

"@cf/google/gemma-4-26b-a4b-it"

"@cf/moonshotai/kimi-k2.5"

"anthropic/claude-3-7-sonnet"

"anthropic/claude-sonnet-4"

"anthropic/claude-opus-4"

"anthropic/claude-3-5-haiku"

"cerebras/qwen-3-235b-a22b-instruct"

"cerebras/qwen-3-235b-a22b-thinking"

"cerebras/llama-3.3-70b"

"cerebras/llama-4-maverick-17b-128e-instruct"

"cerebras/llama-4-scout-17b-16e-instruct"

"cerebras/gpt-oss-120b"

"google-ai-studio/gemini-2.5-flash"

"google-ai-studio/gemini-2.5-pro"

"grok/grok-4"

"groq/llama-3.3-70b-versatile"

"groq/llama-3.1-8b-instant"

"openai/gpt-5"

"openai/gpt-5-mini"

"openai/gpt-5-nano"

cache: Optional[bool]

cache_threshold: Optional[Literal["super_strict_match", "close_enough", "flexible_friend", "anything_goes"]]

One of the following:

"super_strict_match"

"close_enough"

"flexible_friend"

"anything_goes"

cache_ttl: Optional[Literal[600, 1800, 3600, 7 more]]

Cache entry TTL in seconds. Allowed values: 600 (10min), 1800 (30min), 3600 (1h), 7200 (2h), 21600 (6h), 43200 (12h), 86400 (24h), 172800 (48h), 259200 (72h), 518400 (6d).

One of the following:

600

1800

3600

7200

21600

43200

86400

172800

259200

518400

chunk_overlap: Optional[int]

maximum: 30

minimum: 0

chunk_size: Optional[int]

minimum: 64

created_by: Optional[str]

custom_metadata: Optional[List[CustomMetadata]]

data_type: Literal["text", "number", "boolean", "datetime"]

One of the following:

"text"

"number"

"boolean"

"datetime"

field_name: str

maxLength: 64

minLength: 1

embedding_model: Optional[Literal["@cf/qwen/qwen3-embedding-0.6b", "@cf/qwen/qwen3-vl-embedding-2b", "@cf/baai/bge-m3", 8 more]]

One of the following:

"@cf/qwen/qwen3-embedding-0.6b"

"@cf/qwen/qwen3-vl-embedding-2b"

"@cf/baai/bge-m3"

"@cf/baai/bge-large-en-v1.5"

"@cf/google/embeddinggemma-300m"

"google-ai-studio/gemini-embedding-001"

"google-ai-studio/gemini-embedding-2-preview"

"google-ai-studio/gemini-embedding-2"

"openai/text-embedding-3-small"

"openai/text-embedding-3-large"

enable: Optional[bool]

engine_version: Optional[float]

fusion_method: Optional[Literal["max", "rrf"]]

One of the following:

"max"

"rrf"

hybrid_search_enabled: Optional[bool] (deprecated)

Deprecated — use index_method instead.

index_method: Optional[IndexMethod]

Controls which storage backends are used during indexing. Defaults to vector-only.

keyword: bool

Enable keyword (BM25) storage backend.

vector: bool

Enable vector (embedding) storage backend.

indexing_options: Optional[IndexingOptions]

keyword_tokenizer: Optional[Literal["porter", "trigram"]]

One of the following:

"porter"

"trigram"

last_activity: Optional[datetime]

format: date-time

max_num_results: Optional[int]

maximum: 50

minimum: 1

metadata: Optional[Metadata]

created_from_aisearch_wizard: Optional[bool]

worker_domain: Optional[str]

modified_by: Optional[str]

namespace: Optional[str]

paused: Optional[bool]

public_endpoint_id: Optional[str]

public_endpoint_params: Optional[PublicEndpointParams]

authorized_hosts: Optional[List[str]]

chat_completions_endpoint: Optional[PublicEndpointParamsChatCompletionsEndpoint]

disabled: Optional[bool]

Disable chat completions endpoint for this public endpoint

custom_domains: Optional[List[str]]

enabled: Optional[bool]

mcp: Optional[PublicEndpointParamsMcp]

description: Optional[str]

disabled: Optional[bool]

Disable MCP endpoint for this public endpoint

rate_limit: Optional[PublicEndpointParamsRateLimit]

period_ms: Optional[int]

maximum: 3600000

minimum: 60000

requests: Optional[int]

minimum: 1

technique: Optional[Literal["fixed", "sliding"]]

One of the following:

"fixed"

"sliding"

search_endpoint: Optional[PublicEndpointParamsSearchEndpoint]

disabled: Optional[bool]

Disable search endpoint for this public endpoint

reranking: Optional[bool]

reranking_model: Optional[Literal["@cf/baai/bge-reranker-base", ""]]

One of the following:

"@cf/baai/bge-reranker-base"

""

retrieval_options: Optional[RetrievalOptions]

boost_by: Optional[List[RetrievalOptionsBoostBy]]

field: str

maxLength: 64

minLength: 1

direction: Optional[Literal["asc", "desc", "exists", "not_exists"]]

One of the following:

"asc"

"desc"

"exists"

"not_exists"

keyword_match_mode: Optional[Literal["and", "or"]]

One of the following:

"and"

"or"

rewrite_model: Optional[Literal["@cf/meta/llama-3.3-70b-instruct-fp8-fast", "@cf/zai-org/glm-4.7-flash", "@cf/meta/llama-3.1-8b-instruct-fast", 27 more]]

One of the following:

"@cf/meta/llama-3.3-70b-instruct-fp8-fast"

"@cf/zai-org/glm-4.7-flash"

"@cf/meta/llama-3.1-8b-instruct-fast"

"@cf/meta/llama-3.1-8b-instruct-fp8"

"@cf/meta/llama-4-scout-17b-16e-instruct"

"@cf/qwen/qwen3-30b-a3b-fp8"

"@cf/deepseek-ai/deepseek-r1-distill-qwen-32b"

"@cf/moonshotai/kimi-k2-instruct"

"@cf/google/gemma-3-12b-it"

"@cf/google/gemma-4-26b-a4b-it"

"@cf/moonshotai/kimi-k2.5"

"anthropic/claude-3-7-sonnet"

"anthropic/claude-sonnet-4"

"anthropic/claude-opus-4"

"anthropic/claude-3-5-haiku"

"cerebras/qwen-3-235b-a22b-instruct"

"cerebras/qwen-3-235b-a22b-thinking"

"cerebras/llama-3.3-70b"

"cerebras/llama-4-maverick-17b-128e-instruct"

"cerebras/llama-4-scout-17b-16e-instruct"

"cerebras/gpt-oss-120b"

"google-ai-studio/gemini-2.5-flash"

"google-ai-studio/gemini-2.5-pro"

"grok/grok-4"

"groq/llama-3.3-70b-versatile"

"groq/llama-3.1-8b-instant"

"openai/gpt-5"

"openai/gpt-5-mini"

"openai/gpt-5-nano"

rewrite_query: Optional[bool]

score_threshold: Optional[float]

maximum: 1

minimum: 0

source: Optional[str]

source_params: Optional[SourceParams]

exclude_items: Optional[List[str]]

List of path patterns to exclude. Uses micromatch glob syntax: * matches within a path segment, ** matches across path segments (e.g., /admin/** matches /admin/users and /admin/settings/advanced)

include_items: Optional[List[str]]

List of path patterns to include. Uses micromatch glob syntax: * matches within a path segment, ** matches across path segments (e.g., /blog/** matches /blog/post and /blog/2024/post)

prefix: Optional[str]

r2_jurisdiction: Optional[str]

web_crawler: Optional[SourceParamsWebCrawler]

parse_options: Optional[SourceParamsWebCrawlerParseOptions]

content_selector: Optional[List[SourceParamsWebCrawlerParseOptionsContentSelector]]

path: str

Glob pattern to match against the page URL path. Uses standard glob syntax: * matches within a segment, ** crosses directories.

maxLength: 200

minLength: 1

selector: str

maxLength: 200

minLength: 1

include_headers: Optional[Dict[str, str]]

Up to 5 custom HTTP headers sent with each crawl request. Names must consist of RFC 7230 token characters (no spaces, colons, or control characters); values may contain only HTAB and printable ASCII characters (no CR/LF).

include_images: Optional[bool]

specific_sitemaps: Optional[List[str]]

List of specific sitemap URLs to use for crawling. Only valid when parse_type is "sitemap".

use_browser_rendering: Optional[bool]

parse_type: Optional[Literal["sitemap", "crawl"]]

One of the following:

"sitemap"

"crawl"

status: Optional[str]

sync_interval: Optional[Literal[900, 1800, 3600, 5 more]]

Interval between automatic syncs, in seconds. Allowed values: 900 (15min), 1800 (30min), 3600 (1h), 7200 (2h), 14400 (4h), 21600 (6h), 43200 (12h), 86400 (24h).

One of the following:

900

1800

3600

7200

14400

21600

43200

86400

token_id: Optional[str]

format: uuid

type: Optional[Literal["r2", "web-crawler"]]

One of the following:

"r2"

"web-crawler"

class InstanceStatsResponse: …

completed: Optional[int]

degraded: Optional[bool]

True when status counts are unavailable (e.g. legacy stats query exceeded D1 statement-size limit). Counts are omitted in this case.

engine: Optional[Engine]

Engine-specific metadata. Present only for managed (v3) instances.

r2: Optional[EngineR2]

R2 bucket storage usage in bytes.

metadata_size_bytes: int

object_count: int

payload_size_bytes: int

vectorize: Optional[EngineVectorize]

Vectorize index metadata (dimensions, vector count).

dimensions: int

vectors_count: int

error: Optional[int]

file_embed_errors: Optional[Dict[str, object]]

index_source_errors: Optional[Dict[str, object]]

last_activity: Optional[datetime]

format: date-time

outdated: Optional[int]

queued: Optional[int]

running: Optional[int]

skipped: Optional[int]

class InstanceSearchResponse: …

chunks: List[Chunk]

id: str

score: float

maximum: 1

minimum: 0

text: str

type: str

item: Optional[ChunkItem]

key: str

metadata: Optional[Dict[str, object]]

timestamp: Optional[float]

scoring_details: Optional[ChunkScoringDetails]

fusion_method: Optional[Literal["rrf", "max"]]

One of the following:

"rrf"

"max"

keyword_rank: Optional[float]

keyword_score: Optional[float]

minimum: 0

reranking_score: Optional[float]

maximum: 1

minimum: 0

vector_rank: Optional[float]

vector_score: Optional[float]

maximum: 1

minimum: 0

query_kind: Literal["text", "image", "multimodal"]

One of the following:

"text"

"image"

"multimodal"

search_query: Optional[str]

class InstanceChatCompletionsResponse: …

choices: List[Choice]

message: ChoiceMessage

content: Union[str, List[ChoiceMessageContentUnionMember1], None]

One of the following:

str

List[ChoiceMessageContentUnionMember1]

One of the following:

class ChoiceMessageContentUnionMember1UnionMember0: …

text: str

minLength: 1

type: Literal["text"]

class ChoiceMessageContentUnionMember1UnionMember1: …

image_url: ChoiceMessageContentUnionMember1UnionMember1ImageURL

url: str

maxLength: 20971520

minLength: 1

type: Literal["image_url"]

role: Literal["system", "developer", "user", 2 more]

One of the following:

"system"

"developer"

"user"

"assistant"

"tool"

index: Optional[int]

chunks: List[Chunk]

id: str

score: float

maximum: 1

minimum: 0

text: str

type: str

item: Optional[ChunkItem]

key: str

metadata: Optional[Dict[str, object]]

timestamp: Optional[float]

scoring_details: Optional[ChunkScoringDetails]

fusion_method: Optional[Literal["rrf", "max"]]

One of the following:

"rrf"

"max"

keyword_rank: Optional[float]

keyword_score: Optional[float]

minimum: 0

reranking_score: Optional[float]

maximum: 1

minimum: 0

vector_rank: Optional[float]

vector_score: Optional[float]

maximum: 1

minimum: 0

id: Optional[str]

model: Optional[str]

object: Optional[str]

Models (Expand / Collapse)

class JobListResponse: …

id: str

source: Literal["user", "schedule"]

One of the following:

"user"

"schedule"

description: Optional[str]

end_reason: Optional[str]

ended_at: Optional[str]

last_seen_at: Optional[str]

started_at: Optional[str]

class JobCreateResponse: …

id: str

source: Literal["user", "schedule"]

One of the following:

"user"

"schedule"

description: Optional[str]

end_reason: Optional[str]

ended_at: Optional[str]

last_seen_at: Optional[str]

started_at: Optional[str]

class JobGetResponse: …

id: str

source: Literal["user", "schedule"]

One of the following:

"user"

"schedule"

description: Optional[str]

end_reason: Optional[str]

ended_at: Optional[str]

last_seen_at: Optional[str]

started_at: Optional[str]

List[JobLogsResponseItem]

id: int

created_at: float

message: str

message_type: int

Instances

List instances.

Create new instance.

Read instance.

Update instance.

Delete instance.

Stats

Search

Chat Completions

Models (Expand / Collapse)

Instances: Jobs

List Jobs

Create new job

Get Job Details

List Job Logs

Models (Expand / Collapse)