Skip to content

Commit

Permalink
Fix missing sys handling
Browse files (browse the repository at this point in the history)
  • Loading branch information
Maxusmusti committed Jun 20, 2024
1 parent c27e20b commit cc556f7
Showing 1 changed file with 4 additions and 1 deletion.
5 changes: 4 additions & 1 deletion src/instructlab/training/data_process.py
Original file line number | Diff line number | Diff line change
Expand Up @@ -196,7 +196,10 @@ def main(args: DataProcessArgs):

     eos_tk = get_sp_token(tokenizer, SPECIAL_TOKENS.eos)
     pad_tk = get_sp_token(tokenizer, SPECIAL_TOKENS.pad)
-    system_tk = get_sp_token(tokenizer, SPECIAL_TOKENS.system)
+    if SPECIAL_TOKENS.system:
+        system_tk = get_sp_token(tokenizer, SPECIAL_TOKENS.system)
+    else:
+        system_tk = None
     user_tk = get_sp_token(tokenizer, SPECIAL_TOKENS.user)
     assistant_tk = get_sp_token(tokenizer, SPECIAL_TOKENS.assistant)
     log_rank_0(
Expand Down

0 comments on commit cc556f7

Please sign in to comment.