{
  "schemaVersion": "1.0",
  "item": {
    "slug": "arxiv-summarizer-orchestrator",
    "name": "Arxiv Summarizer Orchestrator",
    "source": "tencent",
    "type": "skill",
    "category": "AI 智能",
    "sourceUrl": "https://clawhub.ai/xukp20/arxiv-summarizer-orchestrator",
    "canonicalUrl": "https://clawhub.ai/xukp20/arxiv-summarizer-orchestrator",
    "targetPlatform": "OpenClaw"
  },
  "install": {
    "downloadMode": "redirect",
    "downloadUrl": "/downloads/arxiv-summarizer-orchestrator",
    "sourceDownloadUrl": "https://wry-manatee-359.convex.site/api/v1/download?slug=arxiv-summarizer-orchestrator",
    "sourcePlatform": "tencent",
    "targetPlatform": "OpenClaw",
    "installMethod": "Manual import",
    "extraction": "Extract archive",
    "prerequisites": [
      "OpenClaw"
    ],
    "packageFormat": "ZIP package",
    "includedAssets": [
      "SKILL.md",
      "references/workflow-checklist.md",
      "agents/openai.yaml"
    ],
    "primaryDoc": "SKILL.md",
    "quickSetup": [
      "Download the package from Yavira.",
      "Extract the archive and review SKILL.md first.",
      "Import or place the package into your OpenClaw setup."
    ],
    "agentAssist": {
      "summary": "Hand the extracted package to your coding agent with a concrete install brief instead of figuring it out manually.",
      "steps": [
        "Download the package from Yavira.",
        "Extract it into a folder your agent can access.",
        "Paste one of the prompts below and point your agent at the extracted folder."
      ],
      "prompts": [
        {
          "label": "New install",
          "body": "I downloaded a skill package from Yavira. Read SKILL.md from the extracted folder and install it by following the included instructions. Tell me what you changed and call out any manual steps you could not complete."
        },
        {
          "label": "Upgrade existing",
          "body": "I downloaded an updated skill package from Yavira. Read SKILL.md from the extracted folder, compare it with my current installation, and upgrade it while preserving any custom configuration unless the package docs explicitly say otherwise. Summarize what changed and any follow-up checks I should run."
        }
      ]
    },
    "sourceHealth": {
      "source": "tencent",
      "status": "healthy",
      "reason": "direct_download_ok",
      "recommendedAction": "download",
      "checkedAt": "2026-04-23T16:43:11.935Z",
      "expiresAt": "2026-04-30T16:43:11.935Z",
      "httpStatus": 200,
      "finalUrl": "https://wry-manatee-359.convex.site/api/v1/download?slug=4claw-imageboard",
      "contentType": "application/zip",
      "probeMethod": "head",
      "details": {
        "probeUrl": "https://wry-manatee-359.convex.site/api/v1/download?slug=4claw-imageboard",
        "contentDisposition": "attachment; filename=\"4claw-imageboard-1.0.1.zip\"",
        "redirectLocation": null,
        "bodySnippet": null
      },
      "scope": "source",
      "summary": "Source download looks usable.",
      "detail": "Yavira can redirect you to the upstream package for this source.",
      "primaryActionLabel": "Download for OpenClaw",
      "primaryActionHref": "/downloads/arxiv-summarizer-orchestrator"
    },
    "validation": {
      "installChecklist": [
        "Use the Yavira download entry.",
        "Review SKILL.md after the package is downloaded.",
        "Confirm the extracted package contains the expected setup assets."
      ],
      "postInstallChecks": [
        "Confirm the extracted package includes the expected docs or setup files.",
        "Validate the skill or prompts are available in your target agent workspace.",
        "Capture any manual follow-up steps the agent could not complete."
      ]
    },
    "downloadPageUrl": "https://openagent3.xyz/downloads/arxiv-summarizer-orchestrator",
    "agentPageUrl": "https://openagent3.xyz/skills/arxiv-summarizer-orchestrator/agent",
    "manifestUrl": "https://openagent3.xyz/skills/arxiv-summarizer-orchestrator/agent.json",
    "briefUrl": "https://openagent3.xyz/skills/arxiv-summarizer-orchestrator/agent.md"
  },
  "agentAssist": {
    "summary": "Hand the extracted package to your coding agent with a concrete install brief instead of figuring it out manually.",
    "steps": [
      "Download the package from Yavira.",
      "Extract it into a folder your agent can access.",
      "Paste one of the prompts below and point your agent at the extracted folder."
    ],
    "prompts": [
      {
        "label": "New install",
        "body": "I downloaded a skill package from Yavira. Read SKILL.md from the extracted folder and install it by following the included instructions. Tell me what you changed and call out any manual steps you could not complete."
      },
      {
        "label": "Upgrade existing",
        "body": "I downloaded an updated skill package from Yavira. Read SKILL.md from the extracted folder, compare it with my current installation, and upgrade it while preserving any custom configuration unless the package docs explicitly say otherwise. Summarize what changed and any follow-up checks I should run."
      }
    ]
  },
  "documentation": {
    "source": "clawhub",
    "primaryDoc": "SKILL.md",
    "sections": [
      {
        "title": "ArXiv Summarizer Orchestrator",
        "body": "Run the full pipeline by composing three sub-skills."
      },
      {
        "title": "Sub-skill Order",
        "body": "arxiv-search-collector\narxiv-paper-processor\narxiv-batch-reporter"
      },
      {
        "title": "Workflow Parameters",
        "body": "language: manual language parameter used by all stages. Default is English when omitted.\npaper_processing_mode: subagent_parallel or serial.\nmax_parallel_papers: default 5 when paper_processing_mode=subagent_parallel."
      },
      {
        "title": "Stage A: Collection Setup + Query Retrieval",
        "body": "Initialize one run with arxiv-search-collector/scripts/init_collection_run.py.\nModel generates multiple focused queries from original topic and writes a minimal query_plan.json (label + query only).\nRun arxiv-search-collector/scripts/fetch_queries_batch.py with the plan file (recommended).\n(Optional fallback) call arxiv-search-collector/scripts/fetch_query_metadata.py manually for one-by-one fetch.\nModel reads each indexed query list and decides keep indexes.\nMerge selected items with arxiv-search-collector/scripts/merge_selected_papers.py.\nIf relevance/coverage is still not good, iterate Stage A:\n\ngenerate another query plan with new labels,\nfetch again,\nre-merge with --incremental and updated selection-json.\nset weak labels to empty keep list ([]) to explicitly drop them.\n\nPass --language <LANG> to collector scripts so all generated markdown files in Stage A follow the selected language.\nUse serial query fetch in Stage A with conservative controls (for example --min-interval-sec 5, --retry-max 4).\nDefault collector settings already include retries/backoff and run-local throttle state (<run_dir>/.runtime/arxiv_api_state.json), so manual tuning is usually unnecessary.\nPrefer cache reuse (no --force) unless query parameters changed or data refresh is required.\n\nOutput: one run directory with per-paper metadata subdirectories."
      },
      {
        "title": "Stage B: Per-paper Artifact Download + Manual Summary",
        "body": "For each paper directory, invoke sub-skill arxiv-paper-processor once and let that skill produce <paper_dir>/summary.md.\n\nRecommended pre-step for many papers:\n\nRun one batch artifact download before per-paper reading:\n\npython3 arxiv-paper-processor/scripts/download_papers_batch.py \\\n  --run-dir /path/to/run \\\n  --artifact source_then_pdf \\\n  --max-workers 3 \\\n  --min-interval-sec 5 \\\n  --language <LANG>\n\nPer-paper execution steps (inside arxiv-paper-processor):\n\nIf <paper_dir>/summary.md already exists and is complete, skip this paper.\nIf usable source (source/source_extract/*.tex) or PDF (source/paper.pdf) already exists, skip download.\nIf artifacts are missing, download source with arxiv-paper-processor/scripts/download_arxiv_source.py.\nIf source is unusable, download PDF with arxiv-paper-processor/scripts/download_arxiv_pdf.py.\nModel reads content and manually writes <paper_dir>/summary.md by reference format, in language.\n\nParallel strategy for many papers:\n\nDefault: paper_processing_mode=subagent_parallel with max_parallel_papers=5.\nOptional: paper_processing_mode=serial to process one paper at a time.\nIn parallel mode, run multiple arxiv-paper-processor instances in batches; concurrent papers must not exceed max_parallel_papers.\nWait for one batch to finish before starting the next batch.\nIn serial mode, run exactly one arxiv-paper-processor instance at a time.\nSubagent workers should only own one paper directory each to avoid file conflicts.\nDo not use scripts to auto-compose summary text; scripts are download-only tools.\n\nOutput: all paper directories contain summary.md."
      },
      {
        "title": "Stage C: Bundle + Final Hierarchical Report",
        "body": "Run arxiv-batch-reporter/scripts/collect_summaries_bundle.py --language <LANG>.\nModel reads summaries_bundle.md and writes collection_report_template.md in base dir.\nIn template, each paper leaf entry must include one standalone placeholder line: {{ARXIV_BRIEF:<arxiv_id>}}.\nRun arxiv-batch-reporter/scripts/render_collection_report.py to generate final collection_report.md.\nDo not manually paraphrase per-paper conclusion lines in final report; they must come from per-paper summary.md section 10 via script injection.\n\nIf language is non-English (for example Chinese), all intermediate markdown files and final reports should follow that language."
      },
      {
        "title": "Periodic Scheduling",
        "body": "This orchestrator is suitable for cron/scheduled execution in OpenClaw:\n\nFrequency examples: daily, weekly, monthly.\nFor rolling windows, use lookback (1d, 7d, 30d) when initializing runs."
      },
      {
        "title": "Output Layout",
        "body": "<output-root>/<topic>-<timestamp>-<range>/\n\ntask_meta.json, task_meta.md\nquery_results/, query_selection/\n<arxiv_id>/metadata.md + downloaded source/pdf + summary.md\nsummaries_bundle.md\ncollection_report_template.md\nfinal rendered collection report (e.g. collection_report.md)\n\nUse references/workflow-checklist.md as execution checklist."
      },
      {
        "title": "Related Skills",
        "body": "This is the top-level orchestration skill.\n\nBefore using it, install and enable these three sub-skills:\n\narxiv-search-collector\narxiv-paper-processor\narxiv-batch-reporter\n\nExecution order inside this orchestrator:\n\narxiv-search-collector (Stage A)\narxiv-paper-processor (Stage B)\narxiv-batch-reporter (Stage C)"
      }
    ],
    "body": "ArXiv Summarizer Orchestrator\n\nRun the full pipeline by composing three sub-skills.\n\nSub-skill Order\narxiv-search-collector\narxiv-paper-processor\narxiv-batch-reporter\nWorkflow Parameters\nlanguage: manual language parameter used by all stages. Default is English when omitted.\npaper_processing_mode: subagent_parallel or serial.\nmax_parallel_papers: default 5 when paper_processing_mode=subagent_parallel.\nWorkflow\nStage A: Collection Setup + Query Retrieval\nInitialize one run with arxiv-search-collector/scripts/init_collection_run.py.\nModel generates multiple focused queries from original topic and writes a minimal query_plan.json (label + query only).\nRun arxiv-search-collector/scripts/fetch_queries_batch.py with the plan file (recommended).\n(Optional fallback) call arxiv-search-collector/scripts/fetch_query_metadata.py manually for one-by-one fetch.\nModel reads each indexed query list and decides keep indexes.\nMerge selected items with arxiv-search-collector/scripts/merge_selected_papers.py.\nIf relevance/coverage is still not good, iterate Stage A:\ngenerate another query plan with new labels,\nfetch again,\nre-merge with --incremental and updated selection-json.\nset weak labels to empty keep list ([]) to explicitly drop them.\n\nPass --language <LANG> to collector scripts so all generated markdown files in Stage A follow the selected language. Use serial query fetch in Stage A with conservative controls (for example --min-interval-sec 5, --retry-max 4). Default collector settings already include retries/backoff and run-local throttle state (<run_dir>/.runtime/arxiv_api_state.json), so manual tuning is usually unnecessary. Prefer cache reuse (no --force) unless query parameters changed or data refresh is required.\n\nOutput: one run directory with per-paper metadata subdirectories.\n\nStage B: Per-paper Artifact Download + Manual Summary\n\nFor each paper directory, invoke sub-skill arxiv-paper-processor once and let that skill produce <paper_dir>/summary.md.\n\nRecommended pre-step for many papers:\n\nRun one batch artifact download before per-paper reading:\npython3 arxiv-paper-processor/scripts/download_papers_batch.py \\\n  --run-dir /path/to/run \\\n  --artifact source_then_pdf \\\n  --max-workers 3 \\\n  --min-interval-sec 5 \\\n  --language <LANG>\n\n\nPer-paper execution steps (inside arxiv-paper-processor):\n\nIf <paper_dir>/summary.md already exists and is complete, skip this paper.\nIf usable source (source/source_extract/*.tex) or PDF (source/paper.pdf) already exists, skip download.\nIf artifacts are missing, download source with arxiv-paper-processor/scripts/download_arxiv_source.py.\nIf source is unusable, download PDF with arxiv-paper-processor/scripts/download_arxiv_pdf.py.\nModel reads content and manually writes <paper_dir>/summary.md by reference format, in language.\n\nParallel strategy for many papers:\n\nDefault: paper_processing_mode=subagent_parallel with max_parallel_papers=5.\nOptional: paper_processing_mode=serial to process one paper at a time.\nIn parallel mode, run multiple arxiv-paper-processor instances in batches; concurrent papers must not exceed max_parallel_papers.\nWait for one batch to finish before starting the next batch.\nIn serial mode, run exactly one arxiv-paper-processor instance at a time.\nSubagent workers should only own one paper directory each to avoid file conflicts.\nDo not use scripts to auto-compose summary text; scripts are download-only tools.\n\nOutput: all paper directories contain summary.md.\n\nStage C: Bundle + Final Hierarchical Report\nRun arxiv-batch-reporter/scripts/collect_summaries_bundle.py --language <LANG>.\nModel reads summaries_bundle.md and writes collection_report_template.md in base dir.\nIn template, each paper leaf entry must include one standalone placeholder line: {{ARXIV_BRIEF:<arxiv_id>}}.\nRun arxiv-batch-reporter/scripts/render_collection_report.py to generate final collection_report.md.\nDo not manually paraphrase per-paper conclusion lines in final report; they must come from per-paper summary.md section 10 via script injection.\n\nIf language is non-English (for example Chinese), all intermediate markdown files and final reports should follow that language.\n\nPeriodic Scheduling\n\nThis orchestrator is suitable for cron/scheduled execution in OpenClaw:\n\nFrequency examples: daily, weekly, monthly.\nFor rolling windows, use lookback (1d, 7d, 30d) when initializing runs.\nOutput Layout\n\n<output-root>/<topic>-<timestamp>-<range>/\n\ntask_meta.json, task_meta.md\nquery_results/, query_selection/\n<arxiv_id>/metadata.md + downloaded source/pdf + summary.md\nsummaries_bundle.md\ncollection_report_template.md\nfinal rendered collection report (e.g. collection_report.md)\n\nUse references/workflow-checklist.md as execution checklist.\n\nRelated Skills\n\nThis is the top-level orchestration skill.\n\nBefore using it, install and enable these three sub-skills:\n\narxiv-search-collector\narxiv-paper-processor\narxiv-batch-reporter\n\nExecution order inside this orchestrator:\n\narxiv-search-collector (Stage A)\narxiv-paper-processor (Stage B)\narxiv-batch-reporter (Stage C)"
  },
  "trust": {
    "sourceLabel": "tencent",
    "provenanceUrl": "https://clawhub.ai/xukp20/arxiv-summarizer-orchestrator",
    "publisherUrl": "https://clawhub.ai/xukp20/arxiv-summarizer-orchestrator",
    "owner": "xukp20",
    "version": "0.1.1",
    "license": null,
    "verificationStatus": "Indexed source record"
  },
  "links": {
    "detailUrl": "https://openagent3.xyz/skills/arxiv-summarizer-orchestrator",
    "downloadUrl": "https://openagent3.xyz/downloads/arxiv-summarizer-orchestrator",
    "agentUrl": "https://openagent3.xyz/skills/arxiv-summarizer-orchestrator/agent",
    "manifestUrl": "https://openagent3.xyz/skills/arxiv-summarizer-orchestrator/agent.json",
    "briefUrl": "https://openagent3.xyz/skills/arxiv-summarizer-orchestrator/agent.md"
  }
}