feat: SkillForge — automated skill discovery, evaluation & integration engine (#144)

* feat: add SkillForge — automated skill discovery, evaluation, and integration engine SkillForge adds a 3-stage pipeline for autonomous skill management: - Scout: discovers candidate skills from GitHub (extensible to ClawHub, HuggingFace) - Evaluate: scores candidates on compatibility, quality, and security (weighted 0.30/0.35/0.35) - Integrate: generates standard SKILL.toml + SKILL.md manifests for approved candidates Thresholds: >=0.7 auto-integrate, 0.4-0.7 manual review, <0.4 skip. Uses only existing dependencies (reqwest, serde, tokio, tracing, chrono, anyhow). Includes unit tests for all modules. * fix: address code review feedback on SkillForge PR #115 - evaluate: whole-word matching for BAD_PATTERNS (fixes hackathon false positive) - evaluate: guard against future timestamps in recency bonus - integrate: escape URLs in TOML output via escape_toml() - integrate: handle control chars (\n, \r, \t, \b, \f) in escape_toml() - mod: redact github_token in Debug impl to prevent log leakage - mod: fix auto_integrated count when auto_integrate=false - mod: per-candidate error handling (single failure no longer aborts pipeline) - scout: add 30s request timeout, remove unused token field - deps: enable chrono serde feature for DateTime serialization - tests: add hackathon/exact-hack tests, update escape_toml test coverage * fix: address round-2 CodeRabbit review feedback - integrate: add sanitize_path_component() to prevent directory traversal - mod: GitHub scout failure now logs warning and continues (no pipeline abort) - scout: network/parse errors per-query use warn+continue instead of ? - scout: implement std::str::FromStr for ScoutSource (replaces custom from_str) - tests: add path sanitization tests (traversal, separators, dot trimming) --------- Co-authored-by: stawky <stakeswky@gmail.com>
2026-02-15 09:26:13 -05:00 · 2026-02-15 09:26:13 -05:00 · 35b63d6b12
commit 35b63d6b12
parent 2ac571f406
7 changed files with 1098 additions and 1 deletions
--- a/src/skillforge/mod.rs
+++ b/src/skillforge/mod.rs
@ -0,0 +1,255 @@
+//! SkillForge — Skill auto-discovery, evaluation, and integration engine.
+//!
+//! Pipeline: Scout → Evaluate → Integrate
+//! Discovers skills from external sources, scores them, and generates
+//! ZeroClaw-compatible manifests for qualified candidates.
+
+pub mod evaluate;
+pub mod integrate;
+pub mod scout;
+
+use anyhow::Result;
+use serde::{Deserialize, Serialize};
+use tracing::{info, warn};
+
+use self::evaluate::{EvalResult, Evaluator, Recommendation};
+use self::integrate::Integrator;
+use self::scout::{GitHubScout, Scout, ScoutResult, ScoutSource};
+
+// ---------------------------------------------------------------------------
+// Configuration
+// ---------------------------------------------------------------------------
+
+#[derive(Clone, Serialize, Deserialize)]
+pub struct SkillForgeConfig {
+    #[serde(default)]
+    pub enabled: bool,
+    #[serde(default = "default_auto_integrate")]
+    pub auto_integrate: bool,
+    #[serde(default = "default_sources")]
+    pub sources: Vec<String>,
+    #[serde(default = "default_scan_interval")]
+    pub scan_interval_hours: u64,
+    #[serde(default = "default_min_score")]
+    pub min_score: f64,
+    /// Optional GitHub personal-access token for higher rate limits.
+    #[serde(default)]
+    pub github_token: Option<String>,
+    /// Directory where integrated skills are written.
+    #[serde(default = "default_output_dir")]
+    pub output_dir: String,
+}
+
+fn default_auto_integrate() -> bool {
+    true
+}
+fn default_sources() -> Vec<String> {
+    vec!["github".into(), "clawhub".into()]
+}
+fn default_scan_interval() -> u64 {
+    24
+}
+fn default_min_score() -> f64 {
+    0.7
+}
+fn default_output_dir() -> String {
+    "./skills".into()
+}
+
+impl Default for SkillForgeConfig {
+    fn default() -> Self {
+        Self {
+            enabled: false,
+            auto_integrate: default_auto_integrate(),
+            sources: default_sources(),
+            scan_interval_hours: default_scan_interval(),
+            min_score: default_min_score(),
+            github_token: None,
+            output_dir: default_output_dir(),
+        }
+    }
+}
+
+impl std::fmt::Debug for SkillForgeConfig {
+    fn fmt(&self, f: &mut std::fmt::Formatter<'_>) -> std::fmt::Result {
+        f.debug_struct("SkillForgeConfig")
+            .field("enabled", &self.enabled)
+            .field("auto_integrate", &self.auto_integrate)
+            .field("sources", &self.sources)
+            .field("scan_interval_hours", &self.scan_interval_hours)
+            .field("min_score", &self.min_score)
+            .field(
+                "github_token",
+                &self.github_token.as_ref().map(|_| "***"),
+            )
+            .field("output_dir", &self.output_dir)
+            .finish()
+    }
+}
+
+// ---------------------------------------------------------------------------
+// ForgeReport — summary of a single pipeline run
+// ---------------------------------------------------------------------------
+
+#[derive(Debug, Clone, Serialize, Deserialize)]
+pub struct ForgeReport {
+    pub discovered: usize,
+    pub evaluated: usize,
+    pub auto_integrated: usize,
+    pub manual_review: usize,
+    pub skipped: usize,
+    pub results: Vec<EvalResult>,
+}
+
+// ---------------------------------------------------------------------------
+// SkillForge
+// ---------------------------------------------------------------------------
+
+pub struct SkillForge {
+    config: SkillForgeConfig,
+    evaluator: Evaluator,
+    integrator: Integrator,
+}
+
+impl SkillForge {
+    pub fn new(config: SkillForgeConfig) -> Self {
+        let evaluator = Evaluator::new(config.min_score);
+        let integrator = Integrator::new(config.output_dir.clone());
+        Self {
+            config,
+            evaluator,
+            integrator,
+        }
+    }
+
+    /// Run the full pipeline: Scout → Evaluate → Integrate.
+    pub async fn forge(&self) -> Result<ForgeReport> {
+        if !self.config.enabled {
+            warn!("SkillForge is disabled — skipping");
+            return Ok(ForgeReport {
+                discovered: 0,
+                evaluated: 0,
+                auto_integrated: 0,
+                manual_review: 0,
+                skipped: 0,
+                results: vec![],
+            });
+        }
+
+        // --- Scout ----------------------------------------------------------
+        let mut candidates: Vec<ScoutResult> = Vec::new();
+
+        for src in &self.config.sources {
+            let source: ScoutSource = src.parse().unwrap(); // Infallible
+            match source {
+                ScoutSource::GitHub => {
+                    let scout = GitHubScout::new(self.config.github_token.clone());
+                    match scout.discover().await {
+                        Ok(mut found) => {
+                            info!(count = found.len(), "GitHub scout returned candidates");
+                            candidates.append(&mut found);
+                        }
+                        Err(e) => {
+                            warn!(error = %e, "GitHub scout failed, continuing with other sources");
+                        }
+                    }
+                }
+                ScoutSource::ClawHub | ScoutSource::HuggingFace => {
+                    info!(source = src.as_str(), "Source not yet implemented — skipping");
+                }
+            }
+        }
+
+        // Deduplicate by URL
+        scout::dedup(&mut candidates);
+        let discovered = candidates.len();
+        info!(discovered, "Total unique candidates after dedup");
+
+        // --- Evaluate -------------------------------------------------------
+        let results: Vec<EvalResult> = candidates
+            .into_iter()
+            .map(|c| self.evaluator.evaluate(c))
+            .collect();
+        let evaluated = results.len();
+
+        // --- Integrate ------------------------------------------------------
+        let mut auto_integrated = 0usize;
+        let mut manual_review = 0usize;
+        let mut skipped = 0usize;
+
+        for res in &results {
+            match res.recommendation {
+                Recommendation::Auto => {
+                    if self.config.auto_integrate {
+                        match self.integrator.integrate(&res.candidate) {
+                            Ok(_) => {
+                                auto_integrated += 1;
+                            }
+                            Err(e) => {
+                                warn!(
+                                    skill = res.candidate.name.as_str(),
+                                    error = %e,
+                                    "Integration failed for candidate, continuing"
+                                );
+                            }
+                        }
+                    } else {
+                        // Count as would-be auto but not actually integrated
+                        manual_review += 1;
+                    }
+                }
+                Recommendation::Manual => {
+                    manual_review += 1;
+                }
+                Recommendation::Skip => {
+                    skipped += 1;
+                }
+            }
+        }
+
+        info!(
+            auto_integrated,
+            manual_review, skipped, "Forge pipeline complete"
+        );
+
+        Ok(ForgeReport {
+            discovered,
+            evaluated,
+            auto_integrated,
+            manual_review,
+            skipped,
+            results,
+        })
+    }
+}
+
+// ---------------------------------------------------------------------------
+// Tests
+// ---------------------------------------------------------------------------
+
+#[cfg(test)]
+mod tests {
+    use super::*;
+
+    #[tokio::test]
+    async fn disabled_forge_returns_empty_report() {
+        let cfg = SkillForgeConfig {
+            enabled: false,
+            ..Default::default()
+        };
+        let forge = SkillForge::new(cfg);
+        let report = forge.forge().await.unwrap();
+        assert_eq!(report.discovered, 0);
+        assert_eq!(report.auto_integrated, 0);
+    }
+
+    #[test]
+    fn default_config_values() {
+        let cfg = SkillForgeConfig::default();
+        assert!(!cfg.enabled);
+        assert!(cfg.auto_integrate);
+        assert_eq!(cfg.scan_interval_hours, 24);
+        assert!((cfg.min_score - 0.7).abs() < f64::EPSILON);
+        assert_eq!(cfg.sources, vec!["github", "clawhub"]);
+    }
+}