Skip to content

Commit ab93dfe

Browse files
committed
add: tests.json for RunPod deployment validation
Define explicit test cases for RunPod's testing phase:
- Basic inference test to verify worker startup
- Structured outputs test to validate new API functionality

This should resolve the indefinite 'testing' phase hang by providing concrete pass/fail criteria instead of relying only on health checks.
1 parent db9553c commit ab93dfe

File tree

1 file changed

+52
-0
lines changed

1 file changed

+52
-0
lines changed

tests.json

Lines changed: 52 additions & 0 deletions
Original file line number | Diff line number | Diff line change
@@ -0,0 +1,52 @@
1+
{
2+
"tests": [
3+
{
4+
"name": "basic_inference",
5+
"input": {
6+
"prompt": "Say hello in one word.",
7+
"sampling_params": {
8+
"max_tokens": 10,
9+
"temperature": 0.1
10+
}
11+
},
12+
"timeout": 120000
13+
},
14+
{
15+
"name": "structured_outputs_json_schema",
16+
"input": {
17+
"messages": [
18+
{
19+
"role": "system",
20+
"content": "You are a helpful assistant."
21+
},
22+
{
23+
"role": "user",
24+
"content": "Analyze: The Eiffel Tower was completed in 1889 for the World's Fair."
25+
}
26+
],
27+
"sampling_params": {
28+
"max_tokens": 200,
29+
"temperature": 0.1,
30+
"extra_body": {
31+
"structured_outputs": {
32+
"json": {
33+
"type": "object",
34+
"properties": {
35+
"reasoning": {"type": "string"},
36+
"question": {"type": "string"}
37+
},
38+
"required": ["reasoning", "question"]
39+
}
40+
}
41+
}
42+
}
43+
},
44+
"timeout": 120000
45+
}
46+
],
47+
"config": {
48+
"gpuTypeId": "NVIDIA RTX A4000",
49+
"gpuCount": 1,
50+
"env": []
51+
}
52+
}

0 commit comments

Comments
 (0)