inputSchema
{
"type": "object",
"required": [
"seedUrl"
],
"properties": {
"seedUrl": {
"type": "string",
"description": "HTTP(S) URL of the seed page. Its host must be listed in network.allowedDomains (whitelisted government sites)."
},
"maxPages": {
"type": "integer",
"description": "Maximum number of pages to fetch, including the seed page, when followPagination is true. Default 1, max 50."
},
"linkScope": {
"enum": [
"default",
"single_page_downloadable"
],
"type": "string",
"description": "single_page_downloadable: process only the seed list screen (no pagination or nested depth); list→detail links on that screen are still followed for whitelisted sites. default: pagination and nested depth apply when enabled."
},
"collectPdf": {
"type": "boolean",
"description": "Include .pdf in items. Default true."
},
"maxTotalFetches": {
"type": "integer",
"description": "Max HTTP GETs per invocation. Default 200, max 200."
},
"nestedLinkDepth": {
"type": "integer",
"description": "Number of levels of child pages to fetch (0, 1, or 2) by following same-origin navigable hrefs, in order to collect more file links. Default 0."
},
"followPagination": {
"type": "boolean",
"description": "If true, try to follow pagination links (rel=next, a 'next' link, or a 下一页 link), up to maxPages pages in total. May not work on single-page applications (SPAs)."
},
"extraAllowedHosts": {
"type": "array",
"items": {
"type": "string"
},
"description": "Optional extra hostnames to add to the link/download allowlist; kb-assistant-app merges the local user-allowlist.json into this field. Cloud WASM typically ignores it."
},
"followDetailPages": {
"type": "boolean",
"description": "When true (default): follow article/detail links from the list (PBOC tiaofasi: emit detail-page HTML URLs for indexing; list-page file hrefs are still collected). When false: collect only file-like hrefs found in the list HTML."
},
"maxNestedUrlsPerLevel": {
"type": "integer",
"description": "Cap of distinct URLs to follow per nested level. Default 12, max 40."
}
}
}
outputSchema
{
"type": "object",
"required": [
"site",
"items"
],
"properties": {
"site": {
"type": "string"
},
"error": {
"type": "string"
},
"items": {
"type": "array",
"items": {
"type": "object",
"required": [
"url",
"title"
],
"properties": {
"url": {
"type": "string"
},
"title": {
"type": "string"
}
}
}
}
}
}