# Journey Fixture: journey-invoice-setup
# Used by `python -m eval interactive` for human-in-the-loop testing
# of the journey chatbot's prompt-building conversation.
---
type: journey
name: journey-invoice-setup

# Folded scalar: the line breaks below are joined with single spaces on load.
description: >
  Interactive test for the journey chatbot — explore a directory of
  Italian invoices and meeting notes, answer the chatbot's questions,
  and verify it produces a well-structured prompt_template for
  data extraction.

# Directory the tester explores during the session.
# NOTE(review): the base path this is resolved against is not visible
# here — confirm against the fixture loader.
directory: sample_files/invoices

# Record kinds covered by this fixture; each has a matching "Mentions ..."
# criterion below.
data_types: [tasks, notes, timelines, projects]

# Criteria the generated prompt_template must satisfy
# Each is scored 0-1 by an LLM judge
expected_template_criteria:
  - "Mentions creating tasks from action items and work descriptions"
  - "Mentions creating notes from meeting summaries"
  - "Mentions extracting timeline events from deadlines and meeting dates"
  - "Mentions creating projects from relevant information"
  - "Sets isAiSuggested=1 on all created records"
  - "Does NOT include projectId assignment logic"
  - "Uses camelCase field names (title, status, priority, dueDate, content)"

# Models to test (empty = use CLI --models default)
models: []