Skip to content

Commit f9d0fcb

Browse files
authored
Merge pull request #165 from runpod-workers/hfix
[HF]: set default max_token size
2 parents 389fad7 + 99b952e commit f9d0fcb

File tree

1 file changed

+5
-1
lines changed

1 file changed

+5
-1
lines changed

src/utils.py

+5 -1
Original file line number | Diff line number | Diff line change
@@ -44,7 +44,11 @@ def __init__(self, job):
44 44
self.max_batch_size = job.get("max_batch_size")
45 45
self.apply_chat_template = job.get("apply_chat_template", False)
46 46
self.use_openai_format = job.get("use_openai_format", False)
47-
self.sampling_params = SamplingParams(max_tokens=100, **job.get("sampling_params", {}))
47+
samp_param = job.get("sampling_params", {})
48+
if "max_tokens" not in samp_param:
49+
samp_param["max_tokens"] = 100
50+
self.sampling_params = SamplingParams(**samp_param)
51+
# self.sampling_params = SamplingParams(max_tokens=100, **job.get("sampling_params", {}))
48 52
self.request_id = random_uuid()
49 53
batch_size_growth_factor = job.get("batch_size_growth_factor")
50 54
self.batch_size_growth_factor = float(batch_size_growth_factor) if batch_size_growth_factor else None

0 commit comments

Comments
 (0)