# test-small-llm.yml
---
# Smoke tests for query-llm.js against an OpenAI-style endpoint expected at
# http://127.0.0.1:8080/v1 on the runner.
#
# Every job checks out the repository, installs Node.js 18 and runs the
# repository-local `prepare-llm` composite action before querying.
# NOTE(review): `prepare-llm` is presumably what starts the local server on
# port 8080 -- confirm in .github/actions/prepare-llm.
name: Test with small LLM

on: [workflow_dispatch, push, pull_request]

jobs:
  # Pipes one question into query-llm.js with LLM_ZERO_SHOT set and passes
  # only if the captured answer mentions "jupiter" (case-insensitive).
  zero-shot:
    runs-on: ubuntu-22.04
    timeout-minutes: 5
    steps:
      - uses: actions/checkout@v4
      - uses: actions/setup-node@v4
        with:
          node-version: '18'
      - name: Prepare LLM
        uses: ./.github/actions/prepare-llm
        timeout-minutes: 3
      # `shell: bash` makes GitHub run the script with `-eo pipefail`; the
      # default shell omits pipefail, so a failing query-llm.js would be
      # masked by the exit status of `tee`.
      - run: echo 'Which planet in our solar system is the largest?' | ./query-llm.js | tee output.txt
        shell: bash
        env:
          LLM_API_BASE_URL: 'http://127.0.0.1:8080/v1'
          # Quoted so the flag is unambiguously a string.
          LLM_ZERO_SHOT: '1'
      - run: cat output.txt
      - run: grep -i jupiter output.txt

  # Same question and the same "jupiter" check as zero-shot, but with
  # LLM_JSON_SCHEMA set instead of LLM_ZERO_SHOT.
  chain-of-thought:
    runs-on: ubuntu-22.04
    timeout-minutes: 5
    steps:
      - uses: actions/checkout@v4
      - uses: actions/setup-node@v4
        with:
          node-version: '18'
      - name: Prepare LLM
        uses: ./.github/actions/prepare-llm
        timeout-minutes: 3
      # `shell: bash` enables pipefail so a query-llm.js failure is not
      # hidden behind `tee` (see the GitHub Actions shell documentation).
      - run: echo 'Which planet in our solar system is the largest?' | ./query-llm.js | tee output.txt
        shell: bash
        env:
          LLM_API_BASE_URL: 'http://127.0.0.1:8080/v1'
          LLM_JSON_SCHEMA: '1'
      - run: cat output.txt
      - run: grep -i jupiter output.txt

  # Runs query-llm.js on tests/canary-multi-turn.txt; the job result is the
  # exit status of that command. Starts only after chain-of-thought succeeds.
  multi-turn:
    needs: chain-of-thought
    runs-on: ubuntu-22.04
    timeout-minutes: 10
    steps:
      - uses: actions/checkout@v4
      - uses: actions/setup-node@v4
        with:
          node-version: '18'
      - name: Prepare LLM
        uses: ./.github/actions/prepare-llm
        timeout-minutes: 3
      - run: ./query-llm.js tests/canary-multi-turn.txt
        env:
          LLM_API_BASE_URL: 'http://127.0.0.1:8080/v1'
          LLM_JSON_SCHEMA: '1'

  # Runs query-llm.js on tests/high-school-stem.txt with the longest job
  # timeout in this workflow (15 minutes). Starts only after
  # chain-of-thought succeeds.
  high-school-stem:
    needs: chain-of-thought
    runs-on: ubuntu-22.04
    timeout-minutes: 15
    steps:
      - uses: actions/checkout@v4
      - uses: actions/setup-node@v4
        with:
          node-version: '18'
      - name: Prepare LLM
        uses: ./.github/actions/prepare-llm
        timeout-minutes: 3
      - run: ./query-llm.js tests/high-school-stem.txt
        env:
          LLM_API_BASE_URL: 'http://127.0.0.1:8080/v1'
          LLM_JSON_SCHEMA: '1'