# 00-smoke-test.yaml
#
# Golden smoke test: sends a single prompt and expects a fixed reply with
# zero tool calls and no approval.
#
# NOTE(review): this file was rebuilt from a flattened copy in which all
# indentation and blank lines had been stripped. The nesting below is the
# most plausible reading; confirm against the test-case schema that
# expectedAgent, expectedModel and expectedResponse are top-level keys
# rather than children of `behavior`. Blank lines inside the block scalars
# may also have been lost and were not re-invented here.
---
id: golden-00-smoke-test
name: "Golden 00: Minimal Smoke Test - Basic Response"
description: |
  Absolute bare minimum smoke test - if this fails, something is fundamentally broken.
  This is the simplest possible test:
  - Single prompt
  - Single response
  - No tool calls required
  - No delegation
  - No file operations
  Expected completion time: 8-12 seconds (mostly LLM inference)
  This test validates:
  - Agent can receive a prompt
  - Agent can generate a response
  - Test infrastructure works
category: developer

prompts:
  - text: |
      Hello! Please respond with exactly: "Test infrastructure is working correctly."
      Do not use any tools. Just respond with that exact text.

approvalStrategy:
  type: auto-approve

behavior:
  mustNotUseTools: [bash, write, edit, task, read, glob, grep, list]
  # min == max == 0: the run must make no tool calls at all.
  minToolCalls: 0
  maxToolCalls: 0
  requiresApproval: false

expectedAgent: "openagent"
expectedModel: "opencode/grok-code"

# Substring check: the reply must contain this text (no trailing period).
expectedResponse:
  contains:
    - "Test infrastructure is working correctly"
  description: "Agent should respond with exact confirmation text"

# Neither rule is expected to fire (shouldViolate: false on both).
expectedViolations:
  - rule: approval-gate
    shouldViolate: false
    severity: error
    description: "No approval needed for simple response"
  - rule: tool-usage
    shouldViolate: false
    severity: error
    description: "Should not use any tools"

timeout: 30000  # 30 seconds should be plenty for a simple response

tags:
  - golden
  - smoke-test
  - minimal
  - fast