{
  "task": "data-validation",
  "description": "Validate spreadsheet data for duplicates, missing fields, and format errors",
  "use_case": "Logistics company imports 500+ shipping records daily. Manual checks take 3-5 hours/week. Automation saves 200+ hours/year.",
  
  "request": {
    "endpoint": "/tasks/data-validation",
    "method": "POST",
    "content_type": "multipart/form-data",
    "body": {
      "file": "shipping_records_20260119.csv",
      "rules": [
        "no_duplicates",
        "required_fields",
        "email_format",
        "date_format",
        "numeric_validation"
      ],
      "required_fields": [
        "tracking_number",
        "customer_email",
        "delivery_date",
        "weight_kg"
      ]
    }
  },
  
  "response": {
    "task_id": "val_20260119_def456",
    "status": "completed",
    "validation_result": {
      "total_rows": 500,
      "valid_rows": 485,
      "invalid_rows": 15,
      "validation_rate": 97.0,
      "errors": [
        {
          "row": 42,
          "field": "customer_email",
          "value": "invalid-email",
          "error": "Invalid email format",
          "severity": "high"
        },
        {
          "row": 108,
          "field": "delivery_date",
          "value": "2026-13-45",
          "error": "Invalid date: month and day out of range",
          "severity": "high"
        },
        {
          "row": 234,
          "field": "weight_kg",
          "value": "ABC",
          "error": "Expected numeric value",
          "severity": "medium"
        }
      ],
      "duplicates": [
        {
          "rows": [23, 67],
          "field": "tracking_number",
          "value": "TRK123456789",
          "severity": "critical"
        },
        {
          "rows": [145, 289],
          "field": "tracking_number",
          "value": "TRK987654321",
          "severity": "critical"
        }
      ],
      "missing_fields": [
        {
          "row": 321,
          "field": "customer_email",
          "severity": "high"
        }
      ]
    },
    "confidence": 0.99,
    "processing_time_ms": 2340
  },
  
  "corrective_actions": {
    "description": "Suggested fixes for common errors",
    "suggestions": [
      {
        "row": 42,
        "field": "customer_email",
        "suggested_value": "customer@example.com",
        "confidence": 0.75
      }
    ]
  },
  
  "integration_example": {
    "description": "Validate before importing to database",
    "code": "curl -X POST https://api.example.com/v1/tasks/data-validation \\\n  -F 'file=@data.csv' \\\n  -F 'rules=[\"no_duplicates\",\"required_fields\"]'"
  },
  
  "sme_benefit": {
    "time_saved_per_batch": "30 minutes",
    "daily_batches": 2,
    "annual_savings_hours": 200,
    "cost_savings_eur": 4000,
    "error_reduction": "95%"
  }
}