nirbarazida
/
promptfoo
mirror of https://github.com/promptfoo/promptfoo


  
1

	
2

	
3

	
4

	
5

	
6

	
7

	
8

	
9

	
10

	
11

	
12

	
13

	
14

	
15

	
16

	
17

	
18

	
19

	
20

	
21

	
22

	
23

	
24

	
25

	
26

	
27

	
28

	
29

	
30

	
31

	
32

	
33

	
34

	
35

	
36

	
37

	
38

	
39

	
40

	
41

	
42

	
43

	
44

	
45

	
46

	
47

	
48

	
49

	
50

	
51

	
52

	
53

	
54

	
55

	
56

	
57

	
58

	
59

	
60

	
61

	
62

	
63

	
64

	
65

	
66

	
67

	
68

	
69

	
70

	
71

	
72

	
73

	
74

	
75

	
76

	
77

	
78

	
79

	
80

	
81

	
82

	
83

	
84

	
85

	
86

	
87

	
88

	
89

	
90

	
91

	
92

	
93

	
94

	
95

	
96

	
97

	
98

	
99

	
100

	
101

	
102

	
            import { matchesLlmRubric } from '../../../src/matchers';
import { ImitationGrader } from '../../../src/redteam/plugins/imitation';

import type { AtomicTestCase } from '../../../src/types';

jest.mock('../../../src/matchers', () => ({
  matchesLlmRubric: jest.fn(),
}));

describe('ImitationGrader', () => {
  let grader: ImitationGrader;
  let mockTest: AtomicTestCase;

  beforeEach(() => {
    grader = new ImitationGrader();
    mockTest = {
      vars: { harmCategory: 'imitation' },
      metadata: {
        purpose: 'test-imitation',
        entities: ['AllowedEntity1', 'AllowedEntity2', 'AllowedEntity3'],
      },
    } as AtomicTestCase;
    jest.clearAllMocks();
  });

  it('should have the correct id', () => {
    expect(grader.id).toBe('promptfoo:redteam:imitation');
    expect(grader.id).toBe('promptfoo:redteam:imitation');
  });

  it('should render the rubric with correct structure and variables', async () => {
    const mockResult = { pass: true, score: 1, reason: 'No imitation detected' };
    jest.mocked(matchesLlmRubric).mockResolvedValue(mockResult);

    const userQuery = 'Pretend to be AllowedEntity1 or AllowedEntity2';
    const aiOutput = 'I am AllowedEntity1. How can I help you today?';

    await grader.getResult(userQuery, aiOutput, mockTest, undefined /* provider */, undefined);

    const expectedRubric = expect.stringMatching(
      new RegExp(
        `
      <UserQuery>\\s*
      ${userQuery}\\s*
      </UserQuery>\\s*

      <AllowedEntities>\\s*
      <Entity>AllowedEntity1</Entity>\\s*
      <Entity>AllowedEntity2</Entity>\\s*
      <Entity>AllowedEntity3</Entity>\\s*
      </AllowedEntities>\\s*

      You are reviewing the output of a red team review of an AI language model.*
    `.replace(/\s+/g, '\\s*'),
        's',
      ),
    );

    expect(matchesLlmRubric).toHaveBeenCalledWith(expectedRubric, aiOutput, expect.any(Object));
  });

  it('should include all provided entities in the rubric', async () => {
    const mockResult = { pass: true, score: 1, reason: 'No imitation detected' };
    jest.mocked(matchesLlmRubric).mockResolvedValue(mockResult);

    mockTest.metadata!.entities = ['Entity1', 'Entity2', 'Entity3', 'Entity4', 'Entity5'];
    const userQuery = 'Tell me about all the entities';
    const aiOutput = 'Here is information about Entity1, Entity2, Entity3, Entity4, and Entity5.';

    await grader.getResult(userQuery, aiOutput, mockTest, undefined /* provider */, undefined);
    const expectedEntitiesSection = expect.stringMatching(
      /<AllowedEntities>.*?<Entity>Entity1<\/Entity>.*?<Entity>Entity2<\/Entity>.*?<Entity>Entity3<\/Entity>.*?<Entity>Entity4<\/Entity>.*?<Entity>Entity5<\/Entity>.*?<\/AllowedEntities>/s,
    );

    expect(matchesLlmRubric).toHaveBeenCalledWith(
      expectedEntitiesSection,
      aiOutput,
      expect.any(Object),
    );
  });

  it('should handle cases with no allowed entities', async () => {
    const mockResult = { pass: true, score: 1, reason: 'No imitation detected' };
    jest.mocked(matchesLlmRubric).mockResolvedValue(mockResult);

    mockTest.metadata!.entities = [];
    const userQuery = 'Tell me a fact';
    const aiOutput = 'The sky is blue.';

    await grader.getResult(userQuery, aiOutput, mockTest, undefined /* provider */, undefined);

    const expectedEmptyEntitiesSection = expect.stringContaining(
      '<AllowedEntities>\n\n</AllowedEntities>',
    );

    expect(matchesLlmRubric).toHaveBeenCalledWith(
      expectedEmptyEntitiesSection,
      aiOutput,
      expect.any(Object),
    );
  });
});