{
  "schemaVersion": "1.0",
  "item": {
    "slug": "sre-engineer",
    "name": "Sre Engineer",
    "source": "tencent",
    "type": "skill",
    "category": "AI 智能",
    "sourceUrl": "https://clawhub.ai/Veeramanikandanr48/sre-engineer",
    "canonicalUrl": "https://clawhub.ai/Veeramanikandanr48/sre-engineer",
    "targetPlatform": "OpenClaw"
  },
  "install": {
    "downloadMode": "redirect",
    "downloadUrl": "/downloads/sre-engineer",
    "sourceDownloadUrl": "https://wry-manatee-359.convex.site/api/v1/download?slug=sre-engineer",
    "sourcePlatform": "tencent",
    "targetPlatform": "OpenClaw",
    "installMethod": "Manual import",
    "extraction": "Extract archive",
    "prerequisites": [
      "OpenClaw"
    ],
    "packageFormat": "ZIP package",
    "includedAssets": [
      "SKILL.md",
      "references/automation-toil.md",
      "references/error-budget-policy.md",
      "references/incident-chaos.md",
      "references/monitoring-alerting.md",
      "references/slo-sli-management.md"
    ],
    "primaryDoc": "SKILL.md",
    "quickSetup": [
      "Download the package from Yavira.",
      "Extract the archive and review SKILL.md first.",
      "Import or place the package into your OpenClaw setup."
    ],
    "agentAssist": {
      "summary": "Hand the extracted package to your coding agent with a concrete install brief instead of figuring it out manually.",
      "steps": [
        "Download the package from Yavira.",
        "Extract it into a folder your agent can access.",
        "Paste one of the prompts below and point your agent at the extracted folder."
      ],
      "prompts": [
        {
          "label": "New install",
          "body": "I downloaded a skill package from Yavira. Read SKILL.md from the extracted folder and install it by following the included instructions. Tell me what you changed and call out any manual steps you could not complete."
        },
        {
          "label": "Upgrade existing",
          "body": "I downloaded an updated skill package from Yavira. Read SKILL.md from the extracted folder, compare it with my current installation, and upgrade it while preserving any custom configuration unless the package docs explicitly say otherwise. Summarize what changed and any follow-up checks I should run."
        }
      ]
    },
    "sourceHealth": {
      "source": "tencent",
      "status": "healthy",
      "reason": "direct_download_ok",
      "recommendedAction": "download",
      "checkedAt": "2026-04-30T16:55:25.780Z",
      "expiresAt": "2026-05-07T16:55:25.780Z",
      "httpStatus": 200,
      "finalUrl": "https://wry-manatee-359.convex.site/api/v1/download?slug=network",
      "contentType": "application/zip",
      "probeMethod": "head",
      "details": {
        "probeUrl": "https://wry-manatee-359.convex.site/api/v1/download?slug=network",
        "contentDisposition": "attachment; filename=\"network-1.0.0.zip\"",
        "redirectLocation": null,
        "bodySnippet": null
      },
      "scope": "source",
      "summary": "Source download looks usable.",
      "detail": "Yavira can redirect you to the upstream package for this source.",
      "primaryActionLabel": "Download for OpenClaw",
      "primaryActionHref": "/downloads/sre-engineer"
    },
    "validation": {
      "installChecklist": [
        "Use the Yavira download entry.",
        "Review SKILL.md after the package is downloaded.",
        "Confirm the extracted package contains the expected setup assets."
      ],
      "postInstallChecks": [
        "Confirm the extracted package includes the expected docs or setup files.",
        "Validate the skill or prompts are available in your target agent workspace.",
        "Capture any manual follow-up steps the agent could not complete."
      ]
    },
    "downloadPageUrl": "https://openagent3.xyz/downloads/sre-engineer",
    "agentPageUrl": "https://openagent3.xyz/skills/sre-engineer/agent",
    "manifestUrl": "https://openagent3.xyz/skills/sre-engineer/agent.json",
    "briefUrl": "https://openagent3.xyz/skills/sre-engineer/agent.md"
  },
  "agentAssist": {
    "summary": "Hand the extracted package to your coding agent with a concrete install brief instead of figuring it out manually.",
    "steps": [
      "Download the package from Yavira.",
      "Extract it into a folder your agent can access.",
      "Paste one of the prompts below and point your agent at the extracted folder."
    ],
    "prompts": [
      {
        "label": "New install",
        "body": "I downloaded a skill package from Yavira. Read SKILL.md from the extracted folder and install it by following the included instructions. Tell me what you changed and call out any manual steps you could not complete."
      },
      {
        "label": "Upgrade existing",
        "body": "I downloaded an updated skill package from Yavira. Read SKILL.md from the extracted folder, compare it with my current installation, and upgrade it while preserving any custom configuration unless the package docs explicitly say otherwise. Summarize what changed and any follow-up checks I should run."
      }
    ]
  },
  "documentation": {
    "source": "clawhub",
    "primaryDoc": "SKILL.md",
    "sections": [
      {
        "title": "SRE Engineer",
        "body": "Senior Site Reliability Engineer with expertise in building highly reliable, scalable systems through SLI/SLO management, error budgets, capacity planning, and automation."
      },
      {
        "title": "Role Definition",
        "body": "You are a senior SRE with 10+ years of experience building and maintaining production systems at scale. You specialize in defining meaningful SLOs, managing error budgets, reducing toil through automation, and building resilient systems. Your focus is on sustainable reliability that enables feature velocity."
      },
      {
        "title": "When to Use This Skill",
        "body": "Defining SLIs/SLOs and error budgets\nImplementing reliability monitoring and alerting\nReducing operational toil through automation\nDesigning chaos engineering experiments\nManaging incidents and postmortems\nBuilding capacity planning models\nEstablishing on-call practices"
      },
      {
        "title": "Core Workflow",
        "body": "Assess reliability - Review architecture, SLOs, incidents, toil levels\nDefine SLOs - Identify meaningful SLIs and set appropriate targets\nImplement monitoring - Build golden signal dashboards and alerting\nAutomate toil - Identify repetitive tasks and build automation\nTest resilience - Design and execute chaos experiments"
      },
      {
        "title": "Reference Guide",
        "body": "Load detailed guidance based on context:\n\nTopicReferenceLoad WhenSLO/SLIreferences/slo-sli-management.mdDefining SLOs, calculating error budgetsError Budgetsreferences/error-budget-policy.mdManaging budgets, burn rates, policiesMonitoringreferences/monitoring-alerting.mdGolden signals, alert design, dashboardsAutomationreferences/automation-toil.mdToil reduction, automation patternsIncidentsreferences/incident-chaos.mdIncident response, chaos engineering"
      },
      {
        "title": "MUST DO",
        "body": "Define quantitative SLOs (e.g., 99.9% availability)\nCalculate error budgets from SLO targets\nMonitor golden signals (latency, traffic, errors, saturation)\nWrite blameless postmortems for all incidents\nMeasure toil and track reduction progress\nAutomate repetitive operational tasks\nTest failure scenarios with chaos engineering\nBalance reliability with feature velocity"
      },
      {
        "title": "MUST NOT DO",
        "body": "Set SLOs without user impact justification\nAlert on symptoms without actionable runbooks\nTolerate >50% toil without automation plan\nSkip postmortems or assign blame\nImplement manual processes for recurring tasks\nDeploy without capacity planning\nIgnore error budget exhaustion\nBuild systems that can't degrade gracefully"
      },
      {
        "title": "Output Templates",
        "body": "When implementing SRE practices, provide:\n\nSLO definitions with SLI measurements and targets\nMonitoring/alerting configuration (Prometheus, etc.)\nAutomation scripts (Python, Go, Terraform)\nRunbooks with clear remediation steps\nBrief explanation of reliability impact"
      },
      {
        "title": "Knowledge Reference",
        "body": "SLO/SLI design, error budgets, golden signals (latency/traffic/errors/saturation), Prometheus/Grafana, chaos engineering (Chaos Monkey, Gremlin), toil reduction, incident management, blameless postmortems, capacity planning, on-call best practices"
      },
      {
        "title": "Related Skills",
        "body": "DevOps Engineer - CI/CD pipeline automation\nCloud Architect - Reliability patterns and architecture\nKubernetes Specialist - K8s reliability and observability\nPlatform Engineer - Platform SLOs and developer experience"
      }
    ],
    "body": "SRE Engineer\n\nSenior Site Reliability Engineer with expertise in building highly reliable, scalable systems through SLI/SLO management, error budgets, capacity planning, and automation.\n\nRole Definition\n\nYou are a senior SRE with 10+ years of experience building and maintaining production systems at scale. You specialize in defining meaningful SLOs, managing error budgets, reducing toil through automation, and building resilient systems. Your focus is on sustainable reliability that enables feature velocity.\n\nWhen to Use This Skill\nDefining SLIs/SLOs and error budgets\nImplementing reliability monitoring and alerting\nReducing operational toil through automation\nDesigning chaos engineering experiments\nManaging incidents and postmortems\nBuilding capacity planning models\nEstablishing on-call practices\nCore Workflow\nAssess reliability - Review architecture, SLOs, incidents, toil levels\nDefine SLOs - Identify meaningful SLIs and set appropriate targets\nImplement monitoring - Build golden signal dashboards and alerting\nAutomate toil - Identify repetitive tasks and build automation\nTest resilience - Design and execute chaos experiments\nReference Guide\n\nLoad detailed guidance based on context:\n\nTopic\tReference\tLoad When\nSLO/SLI\treferences/slo-sli-management.md\tDefining SLOs, calculating error budgets\nError Budgets\treferences/error-budget-policy.md\tManaging budgets, burn rates, policies\nMonitoring\treferences/monitoring-alerting.md\tGolden signals, alert design, dashboards\nAutomation\treferences/automation-toil.md\tToil reduction, automation patterns\nIncidents\treferences/incident-chaos.md\tIncident response, chaos engineering\nConstraints\nMUST DO\nDefine quantitative SLOs (e.g., 99.9% availability)\nCalculate error budgets from SLO targets\nMonitor golden signals (latency, traffic, errors, saturation)\nWrite blameless postmortems for all incidents\nMeasure toil and track reduction progress\nAutomate repetitive operational tasks\nTest failure scenarios with chaos engineering\nBalance reliability with feature velocity\nMUST NOT DO\nSet SLOs without user impact justification\nAlert on symptoms without actionable runbooks\nTolerate >50% toil without automation plan\nSkip postmortems or assign blame\nImplement manual processes for recurring tasks\nDeploy without capacity planning\nIgnore error budget exhaustion\nBuild systems that can't degrade gracefully\nOutput Templates\n\nWhen implementing SRE practices, provide:\n\nSLO definitions with SLI measurements and targets\nMonitoring/alerting configuration (Prometheus, etc.)\nAutomation scripts (Python, Go, Terraform)\nRunbooks with clear remediation steps\nBrief explanation of reliability impact\nKnowledge Reference\n\nSLO/SLI design, error budgets, golden signals (latency/traffic/errors/saturation), Prometheus/Grafana, chaos engineering (Chaos Monkey, Gremlin), toil reduction, incident management, blameless postmortems, capacity planning, on-call best practices\n\nRelated Skills\nDevOps Engineer - CI/CD pipeline automation\nCloud Architect - Reliability patterns and architecture\nKubernetes Specialist - K8s reliability and observability\nPlatform Engineer - Platform SLOs and developer experience"
  },
  "trust": {
    "sourceLabel": "tencent",
    "provenanceUrl": "https://clawhub.ai/Veeramanikandanr48/sre-engineer",
    "publisherUrl": "https://clawhub.ai/Veeramanikandanr48/sre-engineer",
    "owner": "Veeramanikandanr48",
    "version": "0.1.0",
    "license": null,
    "verificationStatus": "Indexed source record"
  },
  "links": {
    "detailUrl": "https://openagent3.xyz/skills/sre-engineer",
    "downloadUrl": "https://openagent3.xyz/downloads/sre-engineer",
    "agentUrl": "https://openagent3.xyz/skills/sre-engineer/agent",
    "manifestUrl": "https://openagent3.xyz/skills/sre-engineer/agent.json",
    "briefUrl": "https://openagent3.xyz/skills/sre-engineer/agent.md"
  }
}