# api/services/batch-agent/eval/fixtures/journey_invoice_setup.yaml

# Journey Fixture: journey-invoice-setup
# Used by `python -m eval interactive` for human-in-the-loop testing
# of the journey chatbot's prompt-building conversation.

# Fixture kind and identifier; the name matches the fixture title above.
type: journey
name: journey-invoice-setup
# Folded scalar (`>`): the indented lines are joined with single spaces
# into one paragraph, and one trailing newline is kept.
description: >
  Interactive test for the journey chatbot — explore a directory of
  Italian invoices and meeting notes, answer the chatbot's questions,
  and verify it produces a well-structured prompt_template for data
  extraction.

# Directory of sample documents explored during the session.
# NOTE(review): relative path — confirm which base directory the eval
# loader resolves it against.
directory: sample_files/invoices
# Presumably the record types the generated prompt_template is expected
# to cover — verify against the fixture loader.
data_types: [tasks, notes, timelines, projects]

# Acceptance criteria for the generated prompt_template.
# An LLM judge scores each criterion independently on a 0-1 scale.
expected_template_criteria:
  - 'Mentions creating tasks from action items and work descriptions'
  - 'Mentions creating notes from meeting summaries'
  - 'Mentions extracting timeline events from deadlines and meeting dates'
  - 'Mentions creating projects from relevant information'
  - 'Sets isAiSuggested=1 on all created records'
  - 'Does NOT include projectId assignment logic'
  - 'Uses camelCase field names (title, status, priority, dueDate, content)'

# Models to run this fixture against.
# An empty list means: fall back to the CLI's `--models` default.
models: []