# action.yml
# Generated from the actions/typescript-action template.
# Action identity: display name, one-line description, and author.
name: 'HoneyHive Evaluation'
description: 'Evaluations for LLM applications'
author: 'HoneyHive'

# Branding for the action; icon and color must be nested under `branding`.
branding:
  icon: 'check-square'
  color: 'yellow'
# Inputs accepted by the action. Each input is a mapping nested under its id;
# the ids themselves (including their mixed camelCase/snake_case spelling) are
# the public interface and are kept exactly as declared.
inputs:
  # Optional; falls back to '.' when not supplied.
  root:
    description: 'The root directory of the evaluation'
    required: false
    default: '.'
  runtime:
    description: 'The runtime to use for the evaluation'
    required: true
  runId:
    description: 'The ID of the run to evaluate'
    required: true
  project:
    description: 'The project associated with the evaluation'
    required: true
  # Optional; falls back to 'average' when not supplied.
  aggregateFunction:
    description: >-
      The function used for aggregating the evaluation results (e.g., average,
      min, max, etc.)
    required: false
    default: 'average'
  # Optional; falls back to the URL below when not supplied.
  apiUrl:
    description: 'The base URL of the Honeyhive API'
    required: false
    default: 'https://api.honeyhive.ai'
  apiKey:
    description: 'The API key for the Honeyhive API'
    required: true
  openaiApiKey:
    description: 'The API key for the OpenAI API'
    required: true
  # Default is an expression; quoted so it is always read as a plain string.
  github_token:
    description: 'Your GitHub token'
    required: true
    default: '${{ github.token }}'
  # Default is built from the workflow ref and the action's id expression.
  step_key:
    description: >-
      A unique key to identify this step. Do not change this unless you know
      what you're doing.
    required: true
    default: '${{ github.workflow_ref }}-${{ github.action }}'
# Outputs exposed by the action. Each output is a mapping nested under its id
# and carries only a description.
outputs:
  status:
    description: 'The status of the evaluation run (e.g., pending or completed)'
  success:
    description: 'Whether all datapoints have passed (true or false)'
  passed:
    description: 'List of passed datapoint_ids or session_ids'
  failed:
    description: 'List of failed datapoint_ids or session_ids'
  metrics:
    description: >-
      Metric level aggregates and details of passed/failed status for each
      metric
  datapoints:
    description: >-
      Details of each datapoint with associated session_id, pass status, and
      metric-level pass/fail status
# How the action executes: `dist/index.js` is the entry point, run with the
# `node20` runtime. Both keys must be nested under `runs`.
runs:
  using: node20
  main: dist/index.js