Skip to content

Commit 8b6509c

Browse files
committed
update recipe
Signed-off-by: SumanthRH <[email protected]>
1 parent 6c35b22 commit 8b6509c

File tree

1 file changed

+8
-6
lines changed

1 file changed

+8
-6
lines changed

recipes/sky-t1-preview/recipe.py

Lines changed: 8 additions & 6 deletions
Original file line number | Diff line number | Diff line change
@@ -36,12 +36,12 @@
3636
SYSTEM_PROMPT = "You are a helpful and harmless assistant. You are Qwen developed by Alibaba. You should think step-by-step." # noqa: E501
3737
MAX_TOKENS = 16384
3838
# We explicitly set the target number of blocks to help tune performance.
39-
# For materialized datasets, the number of blocks determined by ray data can be small,
40-
# especially for a multi-stage pipeline like the one here.
41-
TARGET_NUM_ROWS_PER_BLOCK = 100
39+
# For materialized datasets, the number of blocks determined by ray data can be small
40+
# for a multi-stage pipeline like the one here.
41+
TARGET_NUM_ROWS_PER_BLOCK = 256
4242

4343
# Enable more detailed logging of tasks per actor
44-
ray.init(runtime_env={"env_vars": {"RAY_ENABLE_RECORD_ACTOR_TASK_LOGGING": 1}})
44+
ray.init(runtime_env={"env_vars": {"RAY_ENABLE_RECORD_ACTOR_TASK_LOGGING": "1"}})
4545

4646
# 1. Load datasets
4747
apps_ds = datasets.load_dataset(
@@ -170,9 +170,9 @@
170170
enable_prefix_caching=True,
171171
enable_chunked_prefill=True,
172172
max_num_batched_tokens=4096,
173-
tensor_parallel_size=4,
173+
tensor_parallel_size=2,
174174
),
175-
concurrency=2,
175+
concurrency=4,
176176
batch_size=128,
177177
)
178178

@@ -205,6 +205,8 @@
205205
# Each handles a batch of requests
206206
concurrency=1,
207207
batch_size=16,
208+
# Throttle QPS to avoid rate limit errors
209+
qps=5,
208210
)
209211
# define the reformatter
210212
reformatter = build_llm_processor(

0 commit comments

Comments
 (0)