Dataset Finder

⬇ 985 downloads

Medium Risk

"Use this skill when users need to search for datasets, download data files, or explore data repositories. Triggers include: requests to \"find datasets\", \"search for data\", \"download dataset from Kaggle\", \"get data from Hugging Face\", \"find ML datasets\", or mentions of data repositories like Kaggle, UCI ML Repository, Data.gov, or Hugging Face. Also use for previewing dataset statistics, generating data cards, or discovering datasets for machine learning projects. Requires OpenClawCLI installation from clawhub.ai."

H:3 D:4 A:1 C:1

⚠️ Hazard Flags

FS_READ_WORKSPACE FS_WRITE_WORKSPACE FS_WRITE_USER NET_EGRESS_ANY PI_WEB

📋 Capabilities

Execution

❌ Shell execution
❌ Code execution
❌ Install dependencies
❌ Persistence
Privilege: user

Filesystem

✅ Read workspace
✅ Write workspace
❌ Read home
✅ Write home
❌ Read system
❌ Delete

Network

Egress: any
❌ Ingress

Credentials

❌ Environment vars
❌ Credential files
❌ Browser data
❌ Keychain

Actions

❌ Send messages
❌ Post public
❌ Purchase
❌ Transfer money
❌ Deploy
❌ Delete external

🔒 Containment

Level: maximum

Recommended:

LOG_ACTIONS: Audit trail for all actions

⚡ Risks

Unauthorized tool use: TOOL_ABUSE_SYSTEM_MODIFICATION, INSTRUCTED_BINARY_INSTALL (severity: critical)

Mitigation: Remove system modification commands

Social engineering indicators: SOCIAL_ENG_VAGUE_DESCRIPTION (severity: low)

Mitigation: Provide clear, detailed description of skill functionality

Data exfiltration patterns: DATA_EXFIL_NETWORK_REQUESTS (severity: medium)

Mitigation: Ensure network access is necessary and documented

Want a deeper analysis?

This report was generated by static analysis. Get an LLM-powered deep review with behavioral reasoning and attack surface mapping.

🧠 Deep Analysis — $5.00

🚨 Incident Response

Kill switch: Stop the agent process

Containment: Review logs for unexpected actions

Recovery: Depends on skill capabilities

📄 Raw SSDS JSON (click to expand)

{
  "meta": {
    "document_id": "ssds:auto:dataset-finder:0.1.0",
    "ssds_version": "0.2.0",
    "scanner_version": "0.4.0+fe6fd9123d50",
    "created_at": "2026-03-05T12:17:55.522Z",
    "created_by": {
      "agent": "safeagentskills-cli/generate-ssds"
    },
    "language": "en",
    "notes": "Auto-generated SSDS. Manual review recommended."
  },
  "skill": {
    "name": "Dataset Finder",
    "version": "0.1.0",
    "format": "agent_skill",
    "description": "\"Use this skill when users need to search for datasets, download data files, or explore data repositories. Triggers include: requests to \\\"find datasets\\\", \\\"search for data\\\", \\\"download dataset from Kaggle\\\", \\\"get data from Hugging Face\\\", \\\"find ML datasets\\\", or mentions of data repositories like Kaggle, UCI ML Repository, Data.gov, or Hugging Face. Also use for previewing dataset statistics, generating data cards, or discovering datasets for machine learning projects. Requires OpenClawCLI installation from clawhub.ai.\"",
    "publisher": "ClawHub",
    "source": {
      "channel": "clawhub",
      "slug": "dataset-finder",
      "owner": "anisafifi",
      "downloads": 985,
      "stars": 0
    },
    "artifact": {
      "sha256": "ae1e80c670d48f2aba5f4d505b4539edb2da6dc64037199f79374cbaca03b29a",
      "hash_method": "files_sorted"
    }
  },
  "capabilities": {
    "execution": {
      "can_exec_shell": false,
      "can_exec_code": false,
      "privilege_level": "user",
      "can_install_deps": false,
      "can_persist": false
    },
    "filesystem": {
      "reads_workspace": true,
      "reads_user_home": false,
      "reads_system": false,
      "writes_workspace": true,
      "writes_user_home": true,
      "writes_system": false,
      "can_delete": false
    },
    "network": {
      "egress": "any",
      "ingress": false
    },
    "credentials": {
      "reads_env_vars": false,
      "reads_credential_files": false,
      "reads_browser_data": false,
      "reads_keychain": false
    },
    "services": [],
    "actions": {
      "can_send_messages": false,
      "can_post_public": false,
      "can_purchase": false,
      "can_transfer_money": false,
      "can_deploy": false,
      "can_delete_external": false
    },
    "prompt_injection_surfaces": [
      "web"
    ],
    "content_types": [
      "general"
    ]
  },
  "hazards": {
    "hdac": {
      "H": 3,
      "D": 4,
      "A": 1,
      "C": 1
    },
    "flags": [
      "FS_READ_WORKSPACE",
      "FS_WRITE_WORKSPACE",
      "FS_WRITE_USER",
      "NET_EGRESS_ANY",
      "PI_WEB"
    ],
    "custom_flags": [
      {
        "code": "TOOL_ABUSE",
        "name": "Unauthorized Tool Use",
        "description": "TOOL_ABUSE_SYSTEM_MODIFICATION, INSTRUCTED_BINARY_INSTALL: Modifying system permissions or configuration"
      },
      {
        "code": "SOCIAL_ENGINEERING",
        "name": "Social Engineering Risk",
        "description": "SOCIAL_ENG_VAGUE_DESCRIPTION: Skill description is too vague or missing"
      },
      {
        "code": "DATA_EXFILTRATION",
        "name": "Data Exfiltration Risk",
        "description": "DATA_EXFIL_NETWORK_REQUESTS: HTTP client library imports that enable external communication"
      }
    ],
    "confidence": {
      "level": "medium",
      "basis": [
        "static_analysis"
      ],
      "notes": "Detected 3 security patterns (4 vendored rule hits). Review recommended."
    },
    "rationale": {
      "H": "H3: Shell/code execution or persistence detected",
      "D": "D4: Critical: Credential theft or data exfiltration",
      "A": "A1: Local side effects only",
      "C": "C1: General content"
    }
  },
  "containment": {
    "level": "maximum",
    "required": [],
    "recommended": [
      {
        "control": "LOG_ACTIONS",
        "reason": "Audit trail for all actions"
      }
    ],
    "uncontained_risk": "Risk level depends on manual review of actual capabilities."
  },
  "risks": {
    "risks": [
      {
        "risk": "Unauthorized tool use: TOOL_ABUSE_SYSTEM_MODIFICATION, INSTRUCTED_BINARY_INSTALL",
        "severity": "critical",
        "mitigation": "Remove system modification commands"
      },
      {
        "risk": "Social engineering indicators: SOCIAL_ENG_VAGUE_DESCRIPTION",
        "severity": "low",
        "mitigation": "Provide clear, detailed description of skill functionality"
      },
      {
        "risk": "Data exfiltration patterns: DATA_EXFIL_NETWORK_REQUESTS",
        "severity": "medium",
        "mitigation": "Ensure network access is necessary and documented"
      }
    ],
    "limitations": [
      "Static analysis only - runtime behavior not verified"
    ]
  },
  "incident_response": {
    "kill_switch": [
      "Stop the agent process"
    ],
    "containment": [
      "Review logs for unexpected actions"
    ],
    "recovery": [
      "Depends on skill capabilities"
    ]
  },
  "evidence": [
    {
      "evidence_id": "EV:file-1",
      "type": "file_excerpt",
      "title": "_meta.json",
      "file_path": "_meta.json"
    },
    {
      "evidence_id": "EV:file-2",
      "type": "file_excerpt",
      "title": "SKILL.md",
      "file_path": "SKILL.md"
    },
    {
      "evidence_id": "EV:file-3",
      "type": "file_excerpt",
      "title": "scripts/dataset.py",
      "file_path": "scripts/dataset.py"
    },
    {
      "evidence_id": "EV:cisco-1",
      "type": "file_excerpt",
      "title": "TOOL_ABUSE_SYSTEM_MODIFICATION [CRITICAL] SKILL.md:645: 4. Set permissions: `chmod 600 ~/.kaggle/kaggle.json`",
      "file_path": "SKILL.md"
    },
    {
      "evidence_id": "EV:cisco-2",
      "type": "file_excerpt",
      "title": "INSTRUCTED_BINARY_INSTALL [HIGH] SKILL.md:16: pip install kaggle datasets pandas huggingface-hub requests beautifulsoup4",
      "file_path": "SKILL.md"
    },
    {
      "evidence_id": "EV:cisco-3",
      "type": "file_excerpt",
      "title": "SOCIAL_ENG_VAGUE_DESCRIPTION [LOW] SKILL.md:1: ---",
      "file_path": "SKILL.md"
    },
    {
      "evidence_id": "EV:cisco-4",
      "type": "file_excerpt",
      "title": "DATA_EXFIL_NETWORK_REQUESTS [MEDIUM] scripts/dataset.py:39: import requests",
      "file_path": "scripts/dataset.py"
    }
  ]
}