We read every piece of feedback, and take your input very seriously.
To see all available qualifiers, see our documentation.
There was an error while loading. Please reload this page.
1 parent e456b20 commit 04857dc — Copy full SHA for 04857dc
src/art/preprocessing/tokenize.py
@@ -221,7 +221,15 @@ def tokenize_trajectory(
221
add_special_tokens=False,
222
)
223
token_ids[start:end] = content_token_ids
224
- logprobs[start:end] = [float("nan")] * len(content_token_ids)
+ dict_logprobs = message.get("logprobs")
225
+ if dict_logprobs is None:
226
+ logprobs[start:end] = [float("nan")] * len(content_token_ids)
227
+ elif "content" in dict_logprobs and dict_logprobs["content"]:
228
+ logprobs[start:end] = [lp["logprob"] for lp in dict_logprobs["content"]]
229
+ else:
230
+ raise ValueError(
231
+ f"Message has 'logprobs' key but content is missing or empty: {dict_logprobs}"
232
+ )
233
assistant_mask[start:end] = [1] * len(content_token_ids)
234
else:
235
choice = message
0 commit comments