# Origin: nirbarazida/promptfoo (mirror of https://github.com/promptfoo/promptfoo)
# yaml-language-server: $schema=https://promptfoo.dev/config-schema.json

# Short summary of what this evaluation compares.
description: 'Helicone AI Gateway provider comparison'

providers:
  # Three models, each addressed through the Helicone AI Gateway. They all use
  # the same sampling settings, so the model is the only thing that differs.
  - id: helicone:openai/gpt-4o-mini
    label: 'OpenAI via Helicone Gateway'
    config:
      max_tokens: 500
      temperature: 0.7

  - id: helicone:anthropic/claude-3-5-sonnet
    label: 'Anthropic via Helicone Gateway'
    config:
      max_tokens: 500
      temperature: 0.7

  - id: helicone:groq/llama-3.1-8b-instant
    label: 'Groq via Helicone Gateway'
    config:
      max_tokens: 500
      temperature: 0.7

# Single prompt template. `{{question}}` is the placeholder filled from each
# test case's `vars.question`. The literal block scalar (`|`) keeps the line
# breaks of the text below as written.
prompts:
  - |
    You are a helpful AI assistant. Please answer the following question concisely and accurately.

    Question: {{question}}

    Provide a clear, informative response.

# Test cases. Each entry supplies the `question` variable for the prompt
# template and a list of assertions checked against the model output.
#
# Keyword checks use `icontains` (case-insensitive) instead of `contains`
# (case-sensitive), so an answer that merely capitalises the keyword, e.g. at
# the start of a sentence, is not failed on casing alone. The numeric check
# keeps `contains` because casing does not apply to digits.
tests:
  - description: 'Basic question answering'
    vars:
      question: 'What is machine learning?'
    assert:
      - type: icontains
        value: 'algorithm'
      - type: icontains
        value: 'data'
      - type: llm-rubric
        value: 'Response accurately explains machine learning concepts'

  - description: 'Creative writing task'
    vars:
      question: 'Write a short story about a robot learning to paint in exactly 3 sentences.'
    assert:
      - type: llm-rubric
        value: 'Story is exactly 3 sentences long'
      - type: llm-rubric
        value: 'Story is creative and engaging'
      - type: icontains
        value: 'robot'

  - description: 'Technical explanation'
    vars:
      question: 'Explain the difference between supervised and unsupervised learning.'
    assert:
      - type: icontains
        value: 'supervised'
      - type: icontains
        value: 'unsupervised'
      - type: llm-rubric
        value: 'Explanation clearly distinguishes between the two types of learning'

  - description: 'Math problem solving'
    vars:
      question: 'If a train travels 60 miles per hour for 2.5 hours, how far does it travel?'
    assert:
      # 60 mph * 2.5 h = 150 miles; quoted so the expected value stays a string.
      - type: contains
        value: '150'
      - type: llm-rubric
        value: 'Calculation is correct and clearly explained'

  - description: 'Code explanation'
    vars:
      question: 'What does this Python code do: `[x**2 for x in range(10)]`?'
    assert:
      - type: icontains
        value: 'list comprehension'
      - type: icontains
        value: 'square'
      - type: llm-rubric
        value: 'Explanation is accurate and includes the output'

# Options declared once here rather than on each test case; presumably applied
# as defaults to every entry under `tests` — confirm against the promptfoo
# configuration reference.
defaultTest:
  options:
    # Helicone provides built-in cost tracking
    # Enable cost tracking for comparison
    # NOTE(review): `includeMetrics` could not be confirmed as a recognised
    # promptfoo test option from this file alone — verify it against the
    # promptfoo config schema (https://promptfoo.dev/config-schema.json).
    includeMetrics: true