{
  "schemaVersion": "1.0",
  "item": {
    "slug": "arxiv-paper-processor",
    "name": "Arxiv Paper Processor",
    "source": "tencent",
    "type": "skill",
    "category": "效率提升",
    "sourceUrl": "https://clawhub.ai/xukp20/arxiv-paper-processor",
    "canonicalUrl": "https://clawhub.ai/xukp20/arxiv-paper-processor",
    "targetPlatform": "OpenClaw"
  },
  "install": {
    "downloadMode": "redirect",
    "downloadUrl": "/downloads/arxiv-paper-processor",
    "sourceDownloadUrl": "https://wry-manatee-359.convex.site/api/v1/download?slug=arxiv-paper-processor",
    "sourcePlatform": "tencent",
    "targetPlatform": "OpenClaw",
    "installMethod": "Manual import",
    "extraction": "Extract archive",
    "prerequisites": [
      "OpenClaw"
    ],
    "packageFormat": "ZIP package",
    "includedAssets": [
      "SKILL.md",
      "scripts/download_arxiv_pdf.py",
      "scripts/download_arxiv_source.py",
      "scripts/download_papers_batch.py",
      "references/summary-example-en.md",
      "references/summary-example-zh.md"
    ],
    "primaryDoc": "SKILL.md",
    "quickSetup": [
      "Download the package from Yavira.",
      "Extract the archive and review SKILL.md first.",
      "Import or place the package into your OpenClaw setup."
    ],
    "agentAssist": {
      "summary": "Hand the extracted package to your coding agent with a concrete install brief instead of figuring it out manually.",
      "steps": [
        "Download the package from Yavira.",
        "Extract it into a folder your agent can access.",
        "Paste one of the prompts below and point your agent at the extracted folder."
      ],
      "prompts": [
        {
          "label": "New install",
          "body": "I downloaded a skill package from Yavira. Read SKILL.md from the extracted folder and install it by following the included instructions. Tell me what you changed and call out any manual steps you could not complete."
        },
        {
          "label": "Upgrade existing",
          "body": "I downloaded an updated skill package from Yavira. Read SKILL.md from the extracted folder, compare it with my current installation, and upgrade it while preserving any custom configuration unless the package docs explicitly say otherwise. Summarize what changed and any follow-up checks I should run."
        }
      ]
    },
    "sourceHealth": {
      "source": "tencent",
      "status": "healthy",
      "reason": "direct_download_ok",
      "recommendedAction": "download",
      "checkedAt": "2026-04-23T16:43:11.935Z",
      "expiresAt": "2026-04-30T16:43:11.935Z",
      "httpStatus": 200,
      "finalUrl": "https://wry-manatee-359.convex.site/api/v1/download?slug=4claw-imageboard",
      "contentType": "application/zip",
      "probeMethod": "head",
      "details": {
        "probeUrl": "https://wry-manatee-359.convex.site/api/v1/download?slug=4claw-imageboard",
        "contentDisposition": "attachment; filename=\"4claw-imageboard-1.0.1.zip\"",
        "redirectLocation": null,
        "bodySnippet": null
      },
      "scope": "source",
      "summary": "Source download looks usable.",
      "detail": "Yavira can redirect you to the upstream package for this source.",
      "primaryActionLabel": "Download for OpenClaw",
      "primaryActionHref": "/downloads/arxiv-paper-processor"
    },
    "validation": {
      "installChecklist": [
        "Use the Yavira download entry.",
        "Review SKILL.md after the package is downloaded.",
        "Confirm the extracted package contains the expected setup assets."
      ],
      "postInstallChecks": [
        "Confirm the extracted package includes the expected docs or setup files.",
        "Validate the skill or prompts are available in your target agent workspace.",
        "Capture any manual follow-up steps the agent could not complete."
      ]
    },
    "downloadPageUrl": "https://openagent3.xyz/downloads/arxiv-paper-processor",
    "agentPageUrl": "https://openagent3.xyz/skills/arxiv-paper-processor/agent",
    "manifestUrl": "https://openagent3.xyz/skills/arxiv-paper-processor/agent.json",
    "briefUrl": "https://openagent3.xyz/skills/arxiv-paper-processor/agent.md"
  },
  "agentAssist": {
    "summary": "Hand the extracted package to your coding agent with a concrete install brief instead of figuring it out manually.",
    "steps": [
      "Download the package from Yavira.",
      "Extract it into a folder your agent can access.",
      "Paste one of the prompts below and point your agent at the extracted folder."
    ],
    "prompts": [
      {
        "label": "New install",
        "body": "I downloaded a skill package from Yavira. Read SKILL.md from the extracted folder and install it by following the included instructions. Tell me what you changed and call out any manual steps you could not complete."
      },
      {
        "label": "Upgrade existing",
        "body": "I downloaded an updated skill package from Yavira. Read SKILL.md from the extracted folder, compare it with my current installation, and upgrade it while preserving any custom configuration unless the package docs explicitly say otherwise. Summarize what changed and any follow-up checks I should run."
      }
    ]
  },
  "documentation": {
    "source": "clawhub",
    "primaryDoc": "SKILL.md",
    "sections": [
      {
        "title": "ArXiv Paper Processor",
        "body": "Use this skill for per-paper manual summarization, with optional batch artifact download.\n\nSingle-paper mode: process one paper directory (e.g. <run_dir>/<arxiv_id>/).\nBatch predownload mode: process many paper directories under one run dir before writing summaries."
      },
      {
        "title": "Language Parameter",
        "body": "Use a workflow language parameter (for example English or Chinese) and apply it manually.\nThe per-paper summary.md must be written in the selected language.\nIf download scripts are called directly, pass --language <LANG> for traceability."
      },
      {
        "title": "Core Principle",
        "body": "Scripts only fetch artifacts. The model performs reading and writing."
      },
      {
        "title": "Non-negotiable Constraint",
        "body": "Do not generate summary.md by script-based snippet extraction, regex harvesting, or template autofill.\nDo not use Python/shell scripts to auto-compose section text from abstract/introduction fragments.\nScripts in this skill are only for artifact download (source/pdf) and trace logs.\nThe final summary.md must come from model-side reading and synthesis of the paper content."
      },
      {
        "title": "Optional Batch Artifact Download (Many Papers)",
        "body": "Use this first when Stage B has many papers:\n\npython3 scripts/download_papers_batch.py \\\n  --run-dir /path/to/run \\\n  --artifact source_then_pdf \\\n  --max-workers 3 \\\n  --min-interval-sec 5 \\\n  --language English\n\nKey behavior:\n\nSupports --artifact source, --artifact pdf, or --artifact source_then_pdf (default).\nSupports concurrency (--max-workers) and safe throttling/retry (--min-interval-sec, retry args).\nUses run-local throttle state by default (<run_dir>/.runtime/arxiv_download_state.json) to reduce 429 risk.\nSkips papers that already have usable source/source_extract/*.tex or existing source/paper.pdf (unless --force).\nResume-friendly: if a paper already has a completed summary.md, you can skip that paper's summary-writing step.\nWrites batch log to <run_dir>/download_batch_log.json by default."
      },
      {
        "title": "Step 1: Download Source (Preferred)",
        "body": "python3 scripts/download_arxiv_source.py \\\n  --paper-dir /path/to/run/2602.00528 \\\n  --language English\n\nThis writes:\n\nsource/source_bundle.bin\nsource/source_extract/\nsource/download_source_log.json\n\nIf usable source already exists and --force is not set, the script reuses local artifacts."
      },
      {
        "title": "Step 2: If Needed, Download PDF",
        "body": "python3 scripts/download_arxiv_pdf.py \\\n  --paper-dir /path/to/run/2602.00528 \\\n  --language English\n\nThis writes:\n\nsource/paper.pdf\nsource/download_pdf_log.json\n\nIf PDF already exists and --force is not set, the script reuses local artifacts."
      },
      {
        "title": "Step 3: Model Reads and Summarizes",
        "body": "If summary.md already exists and follows the required format, skip this paper and mark it complete.\nRead metadata.md first.\nIf source/source_extract/ already exists with readable .tex files, use it directly.\nOtherwise, if source/paper.pdf already exists, use PDF directly.\nIf neither exists, run download scripts (single-paper scripts or batch script) first.\nManually write summary.md in the same paper directory, in the selected language.\n\nDo not rely on rule-based auto summarization.\nDo not rely on auto-extracted snippets as the primary writing basis."
      },
      {
        "title": "Quality Requirement",
        "body": "Every section should include paper-specific details that are traceable to full-text reading.\nSection 4/5/10 should reflect concrete method and evaluation details, not generic wording.\nIf key details are unclear in the source, explicitly note uncertainty instead of guessing.\nMatch the detail level shown in references/summary-example-en.md and references/summary-example-zh.md.\nIf your draft is clearly shorter or less specific than the examples, expand it before finishing."
      },
      {
        "title": "Required Output",
        "body": "<paper_dir>/summary.md in fixed section format.\nPay special attention to section ## 10. Brief Conclusion: write a 3-4 sentence mini-conclusion that covers contribution, method, evaluation setup, and results with paper-specific details.\nIn section ## 1. Paper Snapshot, use exact keys: ArXiv ID, Title, Authors, Publish date, Primary category, Reading basis.\nDo not use key variants such as Reading source, Author list, Published on, or lowercase key names.\n\nSee references/summary-format.md for exact section requirements."
      },
      {
        "title": "Related Skills",
        "body": "This skill is a sub-skill of arxiv-summarizer-orchestrator.\n\nPipeline position:\n\nStep 1 (upstream): arxiv-search-collector produces the selected paper directories and metadata.\nStep 2 (this skill): arxiv-paper-processor downloads artifacts and writes one summary.md per paper.\nStep 3 (downstream): arxiv-batch-reporter uses these per-paper summaries to generate the final collection report.\n\nUse this skill together with Step 1 and Step 3 for full end-to-end execution."
      }
    ],
    "body": "ArXiv Paper Processor\n\nUse this skill for per-paper manual summarization, with optional batch artifact download.\n\nSingle-paper mode: process one paper directory (e.g. <run_dir>/<arxiv_id>/).\nBatch predownload mode: process many paper directories under one run dir before writing summaries.\nLanguage Parameter\nUse a workflow language parameter (for example English or Chinese) and apply it manually.\nThe per-paper summary.md must be written in the selected language.\nIf download scripts are called directly, pass --language <LANG> for traceability.\nCore Principle\n\nScripts only fetch artifacts. The model performs reading and writing.\n\nNon-negotiable Constraint\nDo not generate summary.md by script-based snippet extraction, regex harvesting, or template autofill.\nDo not use Python/shell scripts to auto-compose section text from abstract/introduction fragments.\nScripts in this skill are only for artifact download (source/pdf) and trace logs.\nThe final summary.md must come from model-side reading and synthesis of the paper content.\nOptional Batch Artifact Download (Many Papers)\n\nUse this first when Stage B has many papers:\n\npython3 scripts/download_papers_batch.py \\\n  --run-dir /path/to/run \\\n  --artifact source_then_pdf \\\n  --max-workers 3 \\\n  --min-interval-sec 5 \\\n  --language English\n\n\nKey behavior:\n\nSupports --artifact source, --artifact pdf, or --artifact source_then_pdf (default).\nSupports concurrency (--max-workers) and safe throttling/retry (--min-interval-sec, retry args).\nUses run-local throttle state by default (<run_dir>/.runtime/arxiv_download_state.json) to reduce 429 risk.\nSkips papers that already have usable source/source_extract/*.tex or existing source/paper.pdf (unless --force).\nResume-friendly: if a paper already has a completed summary.md, you can skip that paper's summary-writing step.\nWrites batch log to <run_dir>/download_batch_log.json by default.\nStep 1: Download Source (Preferred)\npython3 scripts/download_arxiv_source.py \\\n  --paper-dir /path/to/run/2602.00528 \\\n  --language English\n\n\nThis writes:\n\nsource/source_bundle.bin\nsource/source_extract/\nsource/download_source_log.json\n\nIf usable source already exists and --force is not set, the script reuses local artifacts.\n\nStep 2: If Needed, Download PDF\npython3 scripts/download_arxiv_pdf.py \\\n  --paper-dir /path/to/run/2602.00528 \\\n  --language English\n\n\nThis writes:\n\nsource/paper.pdf\nsource/download_pdf_log.json\n\nIf PDF already exists and --force is not set, the script reuses local artifacts.\n\nStep 3: Model Reads and Summarizes\nIf summary.md already exists and follows the required format, skip this paper and mark it complete.\nRead metadata.md first.\nIf source/source_extract/ already exists with readable .tex files, use it directly.\nOtherwise, if source/paper.pdf already exists, use PDF directly.\nIf neither exists, run download scripts (single-paper scripts or batch script) first.\nManually write summary.md in the same paper directory, in the selected language.\n\nDo not rely on rule-based auto summarization. Do not rely on auto-extracted snippets as the primary writing basis.\n\nQuality Requirement\nEvery section should include paper-specific details that are traceable to full-text reading.\nSection 4/5/10 should reflect concrete method and evaluation details, not generic wording.\nIf key details are unclear in the source, explicitly note uncertainty instead of guessing.\nMatch the detail level shown in references/summary-example-en.md and references/summary-example-zh.md.\nIf your draft is clearly shorter or less specific than the examples, expand it before finishing.\nRequired Output\n<paper_dir>/summary.md in fixed section format.\nPay special attention to section ## 10. Brief Conclusion: write a 3-4 sentence mini-conclusion that covers contribution, method, evaluation setup, and results with paper-specific details.\nIn section ## 1. Paper Snapshot, use exact keys: ArXiv ID, Title, Authors, Publish date, Primary category, Reading basis.\nDo not use key variants such as Reading source, Author list, Published on, or lowercase key names.\n\nSee references/summary-format.md for exact section requirements.\n\nRelated Skills\n\nThis skill is a sub-skill of arxiv-summarizer-orchestrator.\n\nPipeline position:\n\nStep 1 (upstream): arxiv-search-collector produces the selected paper directories and metadata.\nStep 2 (this skill): arxiv-paper-processor downloads artifacts and writes one summary.md per paper.\nStep 3 (downstream): arxiv-batch-reporter uses these per-paper summaries to generate the final collection report.\n\nUse this skill together with Step 1 and Step 3 for full end-to-end execution."
  },
  "trust": {
    "sourceLabel": "tencent",
    "provenanceUrl": "https://clawhub.ai/xukp20/arxiv-paper-processor",
    "publisherUrl": "https://clawhub.ai/xukp20/arxiv-paper-processor",
    "owner": "xukp20",
    "version": "0.1.1",
    "license": null,
    "verificationStatus": "Indexed source record"
  },
  "links": {
    "detailUrl": "https://openagent3.xyz/skills/arxiv-paper-processor",
    "downloadUrl": "https://openagent3.xyz/downloads/arxiv-paper-processor",
    "agentUrl": "https://openagent3.xyz/skills/arxiv-paper-processor/agent",
    "manifestUrl": "https://openagent3.xyz/skills/arxiv-paper-processor/agent.json",
    "briefUrl": "https://openagent3.xyz/skills/arxiv-paper-processor/agent.md"
  }
}