File tree Expand file tree Collapse file tree 2 files changed +7
-1
lines changed Expand file tree Collapse file tree 2 files changed +7
-1
lines changed Original file line number Diff line number Diff line change @@ -543,7 +543,7 @@ def main():
543
543
model .parameters (),
544
544
weight_decay = args .weight_decay ,
545
545
lr = args .learning_rate ,
546
- betas = (0.9 , 0.95 ),
546
+ betas = (0.9 , 0.999 ),
547
547
)
548
548
# for group in optimizer.param_groups:
549
549
# group.setdefault("initial_lr", group["lr"])
Original file line number Diff line number Diff line change 8
8
from typing import List , Union
9
9
from utils .common_utils import print_rank_0
10
10
from transformers import AutoTokenizer
11
+ from tokenizer .chat_template import MFTCoder_template
11
12
12
13
13
14
def build_tokenizer (args ):
@@ -20,6 +21,11 @@ def build_tokenizer(args):
20
21
tokenizer = AutoTokenizer .from_pretrained (args .pretrained_model_path , trust_remote_code = True )
21
22
tokenizer .eod_id = tokenizer .convert_tokens_to_ids (args .eos_token )
22
23
tokenizer .pad_id = tokenizer .convert_tokens_to_ids (args .pad_token )
24
+ try :
25
+ tokenizer .eos_token = args .eos_token
26
+ tokenizer .pad_token = args .pad_token
27
+ except :
28
+ print (f"[WARNING]Cannot set tokenizer.eos_token" )
23
29
print_rank_0 (f"Tokenizer: { type (tokenizer )} " )
24
30
print_rank_0 (f"Length of tokenizer: { len (tokenizer )} " )
25
31
print_rank_0 (f"build_tokenizer PAD id: { tokenizer .pad_id } , EOD id: { tokenizer .eod_id } " )
You can’t perform that action at this time.
0 commit comments